
import math
import warnings
from dataclasses import dataclass
from typing import Any, Callable, Optional, Union

import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.nn import BCEWithLogitsLoss, CrossEntropyLoss, MSELoss
from torch.nn.init import _calculate_fan_in_and_fan_out

from ...activations import ACT2FN
from ...modeling_attn_mask_utils import _prepare_4d_attention_mask
from ...modeling_layers import GradientCheckpointingLayer
from ...modeling_outputs import BaseModelOutput, BaseModelOutputWithPooling, ImageClassifierOutput
from ...modeling_utils import ALL_ATTENTION_FUNCTIONS, PreTrainedModel
from ...utils import ModelOutput, auto_docstring, can_return_tuple
from .configuration_siglip2 import Siglip2Config, Siglip2TextConfig, Siglip2VisionConfig


@dataclass
@auto_docstring(
    custom_intro="""
    Base class for vision model's outputs that also contains image embeddings of the pooling of the last hidden states.
    """
)
class Siglip2VisionOutput(ModelOutput):
    r"""
    image_embeds (`torch.FloatTensor` of shape `(batch_size, output_dim)` *optional* returned when model is initialized with `with_projection=True`):
        The image embeddings obtained by applying the projection layer to the pooler_output.
    """

    image_embeds: Optional[torch.FloatTensor] = None
    last_hidden_state: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring(
    custom_intro="""
    Base class for text model's outputs that also contains a pooling of the last hidden states.
    """
)
class Siglip2TextOutput(ModelOutput):
    r"""
    text_embeds (`torch.FloatTensor` of shape `(batch_size, output_dim)` *optional* returned when model is initialized with `with_projection=True`):
        The text embeddings obtained by applying the projection layer to the pooler_output.
    """

    text_embeds: Optional[torch.FloatTensor] = None
    last_hidden_state: Optional[torch.FloatTensor] = None
    hidden_states: Optional[tuple[torch.FloatTensor, ...]] = None
    attentions: Optional[tuple[torch.FloatTensor, ...]] = None


@dataclass
@auto_docstring
class Siglip2Output(ModelOutput):
    r"""
    loss (`torch.FloatTensor` of shape `(1,)`, *optional*, returned when `return_loss` is `True`):
        Contrastive loss for image-text similarity.
    logits_per_image (`torch.FloatTensor` of shape `(image_batch_size, text_batch_size)`):
        The scaled dot product scores between `image_embeds` and `text_embeds`. This represents the image-text
        similarity scores.
    logits_per_text (`torch.FloatTensor` of shape `(text_batch_size, image_batch_size)`):
        The scaled dot product scores between `text_embeds` and `image_embeds`. This represents the text-image
        similarity scores.
    text_embeds (`torch.FloatTensor` of shape `(batch_size, output_dim)`):
        The text embeddings obtained by applying the projection layer to the pooled output of [`Siglip2TextModel`].
    image_embeds (`torch.FloatTensor` of shape `(batch_size, output_dim)`):
        The image embeddings obtained by applying the projection layer to the pooled output of [`Siglip2VisionModel`].
    text_model_output (`BaseModelOutputWithPooling`):
        The output of the [`Siglip2TextModel`].
    vision_model_output (`BaseModelOutputWithPooling`):
        The output of the [`Siglip2VisionModel`].
    """

    loss: Optional[torch.FloatTensor] = None
    logits_per_image: Optional[torch.FloatTensor] = None
    logits_per_text: Optional[torch.FloatTensor] = None
    text_embeds: Optional[torch.FloatTensor] = None
    image_embeds: Optional[torch.FloatTensor] = None
    text_model_output: Optional[BaseModelOutputWithPooling] = None
    vision_model_output: Optional[BaseModelOutputWithPooling] = None

    def to_tuple(self) -> tuple[Any]:
        return tuple(
            self[k] if k not in ["text_model_output", "vision_model_output"] else getattr(self, k).to_tuple()
            for k in self.keys()
        )


class Siglip2VisionEmbeddings(nn.Module):
    def __init__(self, config: Siglip2VisionConfig):
        super().__init__()
        self.config = config
        self.embed_dim = config.hidden_size
        self.patch_size = config.patch_size

        self.patch_embedding = nn.Linear(
            in_features=config.num_channels * self.patch_size * self.patch_size,
            out_features=self.embed_dim,
        )

        self.num_patches = config.num_patches
        self.position_embedding_size = int(self.num_patches**0.5)
        self.position_embedding = nn.Embedding(self.num_patches, self.embed_dim)

    @staticmethod
    def resize_positional_embeddings(
        positional_embeddings: torch.Tensor,
        spatial_shapes: torch.LongTensor,
        max_length: int,
    ) -> torch.Tensor:
        """
        Resize positional embeddings to image-specific size and pad to a fixed size.

        Args:
            positional_embeddings (`torch.Tensor`):
                Position embeddings of shape (height, width, embed_dim)
            spatial_shapes (`torch.LongTensor`):
                Spatial shapes of shape (batch_size, 2) to resize the positional embeddings to
            max_length (`int`):
                Maximum length of the positional embeddings to pad resized positional embeddings to

        Returns:
            `torch.Tensor`: Embeddings of shape (batch_size, max_length, embed_dim)
        """
        batch_size = spatial_shapes.shape[0]
        embed_dim = positional_embeddings.shape[-1]
        source_dtype = positional_embeddings.dtype

        resulted_positional_embeddings = torch.empty(
            (batch_size, max_length, embed_dim),
            device=positional_embeddings.device,
            dtype=source_dtype,
        )

        # (height, width, embed_dim) -> (1, embed_dim, height, width) for interpolation
        positional_embeddings = positional_embeddings.permute(2, 0, 1).unsqueeze(0)

        # Upcast to float32 on CPU because antialiased interpolation is not supported for half precision there
        if positional_embeddings.device.type == "cpu":
            positional_embeddings = positional_embeddings.to(torch.float32)

        for i in range(batch_size):
            # (1, dim, height, width) -> (1, dim, target_height, target_width)
            height, width = spatial_shapes[i]
            resized_embeddings = F.interpolate(
                positional_embeddings,
                size=(height, width),
                mode="bilinear",
                align_corners=False,
                antialias=True,
            )

            # (1, dim, target_height, target_width) -> (target_height * target_width, dim)
            resized_embeddings = resized_embeddings.reshape(embed_dim, height * width).transpose(0, 1)

            # Cast back to the original dtype
            resized_embeddings = resized_embeddings.to(source_dtype)

            resulted_positional_embeddings[i, : height * width] = resized_embeddings
            resulted_positional_embeddings[i, height * width :] = resized_embeddings[0]

        return resulted_positional_embeddings

    def forward(self, pixel_values: torch.FloatTensor, spatial_shapes: torch.LongTensor) -> torch.Tensor:
        """
        Args:
            pixel_values (`torch.FloatTensor`):
                Pixel values of shape (batch_size, max_num_patches, num_channels * patch_size * patch_size)
            spatial_shapes (`list[tuple[int, int]]`):
                Spatial shapes of shape (batch_size, 2) to resize the positional embeddings to
        """
        # Apply patch embeddings to the already patchified pixel values
        target_dtype = self.patch_embedding.weight.dtype
        patch_embeds = self.patch_embedding(pixel_values.to(dtype=target_dtype))

        # Resize and pad the positional embeddings to each image's spatial shape
        positional_embeddings = self.position_embedding.weight.reshape(
            self.position_embedding_size, self.position_embedding_size, -1
        )
        resized_positional_embeddings = self.resize_positional_embeddings(
            positional_embeddings, spatial_shapes, max_length=pixel_values.shape[1]
        )

        # Add positional embeddings to patch embeddings
        embeddings = patch_embeds + resized_positional_embeddings
        return embeddings


def eager_attention_forward(
    module: nn.Module,
    query: torch.Tensor,
    key: torch.Tensor,
    value: torch.Tensor,
    attention_mask: Optional[torch.Tensor],
    scaling: float,
    dropout: float = 0.0,
    **kwargs,
):
    attn_weights = torch.matmul(query, key.transpose(-1, -2)) * scaling
    if attention_mask is not None:
        attn_weights = attn_weights + attention_mask

    attn_weights = nn.functional.softmax(attn_weights, dim=-1, dtype=torch.float32).to(query.dtype)
    attn_weights = nn.functional.dropout(attn_weights, p=dropout, training=module.training)

    attn_output = torch.matmul(attn_weights, value)
    attn_output = attn_output.transpose(1, 2).contiguous()

    return attn_output, attn_weights


class Siglip2Attention(nn.Module):
    """Multi-headed attention from 'Attention Is All You Need' paper"""

    def __init__(self, config):
        super().__init__()
        self.config = config
        self.embed_dim = config.hidden_size
        self.num_heads = config.num_attention_heads
        self.head_dim = self.embed_dim // self.num_heads
        if self.head_dim * self.num_heads != self.embed_dim:
            raise ValueError(
                f"embed_dim must be divisible by num_heads (got `embed_dim`: {self.embed_dim} and `num_heads`:"
                f" {self.num_heads})."
            )
        self.scale = self.head_dim**-0.5
        self.dropout = config.attention_dropout
        self.is_causal = False

        self.k_proj = nn.Linear(self.embed_dim, self.embed_dim)
        self.v_proj = nn.Linear(self.embed_dim, self.embed_dim)
        self.q_proj = nn.Linear(self.embed_dim, self.embed_dim)
        self.out_proj = nn.Linear(self.embed_dim, self.embed_dim)

    def forward(
        self,
        hidden_states: torch.Tensor,
        attention_mask: Optional[torch.Tensor] = None,
        **kwargs,
    ) -> tuple[torch.Tensor, Optional[torch.Tensor]]:
        """Input shape: Batch x Time x Channel"""

        batch_size, seq_length, embed_dim = hidden_states.shape

        queries = self.q_proj(hidden_states)
        keys = self.k_proj(hidden_states)
        values = self.v_proj(hidden_states)

        queries = queries.view(batch_size, seq_length, self.num_heads, self.head_dim).transpose(1, 2)
        keys = keys.view(batch_size, seq_length, self.num_heads, self.head_dim).transpose(1, 2)
        values = values.view(batch_size, seq_length, self.num_heads, self.head_dim).transpose(1, 2)

        attention_interface: Callable = eager_attention_forward
        if self.config._attn_implementation != "eager":
            attention_interface = ALL_ATTENTION_FUNCTIONS[self.config._attn_implementation]

        attn_output, attn_weights = attention_interface(
            self,
            queries,
            keys,
            values,
            attention_mask,
            is_causal=self.is_causal,
            scaling=self.scale,
            dropout=0.0 if not self.training else self.dropout,
        )

        attn_output = attn_output.reshape(batch_size, seq_length, embed_dim).contiguous()
        attn_output = self.out_proj(attn_output)

        return attn_output, attn_weights


class Siglip2MLP(nn.Module):
    def __init__(self, config):
        super().__init__()
        self.config = config
        self.activation_fn = ACT2FN[config.hidden_act]
        self.fc1 = nn.Linear(config.hidden_size, config.intermediate_size)
        self.fc2 = nn.Linear(config.intermediate_size, config.hidden_size)

    def forward(self, hidden_states: torch.Tensor) -> torch.Tensor:
        hidden_states = self.fc1(hidden_states)
        hidden_states = self.activation_fn(hidden_states)
        hidden_states = self.fc2(hidden_states)
        return hidden_states


class Siglip2EncoderLayer(GradientCheckpointingLayer):
    def __init__(self, config: Union[Siglip2VisionConfig, Siglip2TextConfig]):
        super().__init__()
        self.embed_dim = config.hidden_size
        self.layer_norm1 = nn.LayerNorm(self.embed_dim, eps=config.layer_norm_eps)
        self.self_attn = Siglip2Attention(config)
        self.layer_norm2 = nn.LayerNorm(self.embed_dim, eps=config.layer_norm_eps)
        self.mlp = Siglip2MLP(config)

    def forward(
        self,
        hidden_states: torch.Tensor,
        attention_mask: torch.Tensor,
        output_attentions: Optional[bool] = False,
    ) -> tuple[torch.FloatTensor]:
        """
        Args:
            hidden_states (`torch.FloatTensor`):
                Input to the layer of shape `(batch, seq_len, embed_dim)`.
            attention_mask (`torch.FloatTensor`):
                Attention mask of shape `(batch, 1, q_len, k_v_seq_len)` where padding elements are indicated by very large negative values.
            output_attentions (`bool`, *optional*, defaults to `False`):
                Whether or not to return the attentions tensors of all attention layers. See `attentions` under
                returned tensors for more detail.
        """
        residual = hidden_states

        hidden_states = self.layer_norm1(hidden_states)
        hidden_states, attn_weights = self.self_attn(
            hidden_states=hidden_states,
            attention_mask=attention_mask,
            output_attentions=output_attentions,
        )
        hidden_states = residual + hidden_states

        residual = hidden_states
        hidden_states = self.layer_norm2(hidden_states)
        hidden_states = self.mlp(hidden_states)
        hidden_states = residual + hidden_states

        outputs = (hidden_states,)

        if output_attentions:
            outputs += (attn_weights,)

        return outputs


class Siglip2Encoder(nn.Module):
    """
    Transformer encoder consisting of `config.num_hidden_layers` self attention layers. Each layer is a
    [`Siglip2EncoderLayer`].

    Args:
        config: Siglip2Config
    """

    def __init__(self, config: Siglip2Config):
        super().__init__()
        self.config = config
        self.layers = nn.ModuleList([Siglip2EncoderLayer(config) for _ in range(config.num_hidden_layers)])
        self.gradient_checkpointing = False

    @can_return_tuple
    def forward(
        self,
        inputs_embeds,
        attention_mask: Optional[torch.Tensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> BaseModelOutput:
        r"""
        Args:
            inputs_embeds (`torch.FloatTensor` of shape `(batch_size, sequence_length, hidden_size)`):
                Optionally, instead of passing `input_ids` you can choose to directly pass an embedded representation.
                This is useful if you want more control over how to convert `input_ids` indices into associated vectors
                than the model's internal embedding lookup matrix.
            attention_mask (`torch.Tensor` of shape `(batch_size, sequence_length)`, *optional*):
                Mask to avoid performing attention on padding token indices. Mask values selected in `[0, 1]`:

                - 1 for tokens that are **not masked**,
                - 0 for tokens that are **masked**.

                [What are attention masks?](../glossary#attention-mask)
            output_attentions (`bool`, *optional*):
                Whether or not to return the attentions tensors of all attention layers. See `attentions` under
                returned tensors for more detail.
            output_hidden_states (`bool`, *optional*):
                Whether or not to return the hidden states of all layers. See `hidden_states` under returned tensors
                for more detail.
            return_dict (`bool`, *optional*):
                Whether or not to return a [`~utils.ModelOutput`] instead of a plain tuple.
        """
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        encoder_states = () if output_hidden_states else None
        all_attentions = () if output_attentions else None

        hidden_states = inputs_embeds
        for encoder_layer in self.layers:
            if output_hidden_states:
                encoder_states = encoder_states + (hidden_states,)
            layer_outputs = encoder_layer(
                hidden_states,
                attention_mask,
                output_attentions=output_attentions,
            )

            hidden_states = layer_outputs[0]

            if output_attentions:
                all_attentions = all_attentions + (layer_outputs[1],)

        if output_hidden_states:
            encoder_states = encoder_states + (hidden_states,)

        return BaseModelOutput(
            last_hidden_state=hidden_states,
            hidden_states=encoder_states,
            attentions=all_attentions,
        )


class Siglip2VisionTransformer(nn.Module):
    def __init__(self, config: Siglip2VisionConfig):
        super().__init__()
        self.config = config
        embed_dim = config.hidden_size

        self.embeddings = Siglip2VisionEmbeddings(config)
        self.encoder = Siglip2Encoder(config)
        self.post_layernorm = nn.LayerNorm(embed_dim, eps=config.layer_norm_eps)
        self.use_head = True if not hasattr(config, "vision_use_head") else config.vision_use_head
        if self.use_head:
            self.head = Siglip2MultiheadAttentionPoolingHead(config)
        self._use_flash_attention_2 = config._attn_implementation == "flash_attention_2"

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        pixel_values: torch.FloatTensor,
        attention_mask: torch.Tensor,
        spatial_shapes: torch.LongTensor,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> BaseModelOutputWithPooling:
        r"""
        spatial_shapes (`torch.LongTensor` of shape `(batch_size, 2)`):
            Tensor containing the spatial dimensions (height, width) of the input images.
        """
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        hidden_states = self.embeddings(pixel_values, spatial_shapes)

        if attention_mask is not None and not self._use_flash_attention_2:
            # [batch_size, seq_len] -> [batch_size, 1, tgt_seq_len, src_seq_len]
            encoder_attention_mask = _prepare_4d_attention_mask(attention_mask, hidden_states.dtype)
        else:
            encoder_attention_mask = attention_mask

        encoder_outputs = self.encoder(
            inputs_embeds=hidden_states,
            attention_mask=encoder_attention_mask,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        last_hidden_state = encoder_outputs.last_hidden_state
        last_hidden_state = self.post_layernorm(last_hidden_state)

        pooler_output = self.head(last_hidden_state, attention_mask) if self.use_head else None

        return BaseModelOutputWithPooling(
            last_hidden_state=last_hidden_state,
            pooler_output=pooler_output,
            hidden_states=encoder_outputs.hidden_states,
            attentions=encoder_outputs.attentions,
        )


class Siglip2TextEmbeddings(nn.Module):
    def __init__(self, config: Siglip2TextConfig):
        super().__init__()
        embed_dim = config.hidden_size

        self.token_embedding = nn.Embedding(config.vocab_size, embed_dim)
        self.position_embedding = nn.Embedding(config.max_position_embeddings, embed_dim)

        # position_ids (1, len position emb) is contiguous in memory and exported when serialized
        self.register_buffer(
            "position_ids", torch.arange(config.max_position_embeddings).expand((1, -1)), persistent=False
        )

    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        inputs_embeds: Optional[torch.FloatTensor] = None,
    ) -> torch.Tensor:
        seq_length = input_ids.shape[-1] if input_ids is not None else inputs_embeds.shape[-2]
        max_position_embedding = self.position_embedding.weight.shape[0]

        if seq_length > max_position_embedding:
            raise ValueError(
                f"Sequence length must be less than max_position_embeddings (got `sequence length`: "
                f"{seq_length} and max_position_embeddings: {max_position_embedding}"
            )

        if position_ids is None:
            position_ids = self.position_ids[:, :seq_length]

        if inputs_embeds is None:
            inputs_embeds = self.token_embedding(input_ids)

        position_embeddings = self.position_embedding(position_ids)
        embeddings = inputs_embeds + position_embeddings

        return embeddings


def _trunc_normal_(tensor, mean, std, a, b):
    def norm_cdf(x):
        # Computes the standard normal cumulative distribution function
        return (1.0 + math.erf(x / math.sqrt(2.0))) / 2.0

    if (mean < a - 2 * std) or (mean > b + 2 * std):
        warnings.warn(
            "mean is more than 2 std from [a, b] in nn.init.trunc_normal_. "
            "The distribution of values may be incorrect.",
            stacklevel=2,
        )

    # Values are generated by using a truncated uniform distribution and
    # then using the inverse CDF for the normal distribution.
    # Get upper and lower cdf values
    l = norm_cdf((a - mean) / std)
    u = norm_cdf((b - mean) / std)

    # Uniformly fill tensor with values from [2l-1, 2u-1]
    tensor.uniform_(2 * l - 1, 2 * u - 1)

    # Use inverse cdf transform for the normal distribution to get a truncated standard normal
    tensor.erfinv_()

    # Transform to proper mean, std
    tensor.mul_(std * math.sqrt(2.0))
    tensor.add_(mean)

    # Clamp to ensure it's in the proper range
    tensor.clamp_(min=a, max=b)


def trunc_normal_tf_(
    tensor: torch.Tensor, mean: float = 0.0, std: float = 1.0, a: float = -2.0, b: float = 2.0
) -> torch.Tensor:
    """Fills the input Tensor with values drawn from a truncated
    normal distribution. The values are effectively drawn from the
    normal distribution :math:`\\mathcal{N}(\text{mean}, \text{std}^2)`
    with values outside :math:`[a, b]` redrawn until they are within
    the bounds. The method used for generating the random values works
    best when :math:`a \\leq \text{mean} \\leq b`.

    NOTE: this 'tf' variant behaves closer to Tensorflow / JAX impl where the
    bounds [a, b] are applied when sampling the normal distribution with mean=0, std=1.0
    and the result is subsequently scaled and shifted by the mean and std args.

    Args:
        tensor: an n-dimensional `torch.Tensor`
        mean: the mean of the normal distribution
        std: the standard deviation of the normal distribution
        a: the minimum cutoff value
        b: the maximum cutoff value
    """
    with torch.no_grad():
        _trunc_normal_(tensor, 0, 1.0, a, b)
        tensor.mul_(std).add_(mean)


def variance_scaling_(tensor, scale=1.0, mode="fan_in", distribution="normal"):
    fan_in, fan_out = _calculate_fan_in_and_fan_out(tensor)
    if mode == "fan_in":
        denom = fan_in
    elif mode == "fan_out":
        denom = fan_out
    elif mode == "fan_avg":
        denom = (fan_in + fan_out) / 2

    variance = scale / denom

    if distribution == "truncated_normal":
        # constant is stddev of standard normal truncated to (-2, 2)
        trunc_normal_tf_(tensor, std=math.sqrt(variance) / 0.87962566103423978)
    elif distribution == "normal":
        with torch.no_grad():
            tensor.normal_(std=math.sqrt(variance))
    elif distribution == "uniform":
        bound = math.sqrt(3 * variance)
        with torch.no_grad():
            tensor.uniform_(-bound, bound)
    else:
        raise ValueError(f"invalid distribution {distribution}")


def lecun_normal_(tensor):
    variance_scaling_(tensor, mode="fan_in", distribution="truncated_normal")


def default_flax_embed_init(tensor):
    variance_scaling_(tensor, mode="fan_in", distribution="normal")


class Siglip2TextTransformer(nn.Module):
    def __init__(self, config: Siglip2TextConfig):
        super().__init__()
        self.config = config
        embed_dim = config.hidden_size
        self.embeddings = Siglip2TextEmbeddings(config)
        self.encoder = Siglip2Encoder(config)
        self.final_layer_norm = nn.LayerNorm(embed_dim, eps=config.layer_norm_eps)

        self.head = nn.Linear(embed_dim, config.projection_size)
        self._use_flash_attention_2 = config._attn_implementation == "flash_attention_2"

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.Tensor] = None,
        attention_mask: Optional[torch.Tensor] = None,
        position_ids: Optional[torch.Tensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> BaseModelOutputWithPooling:
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        if input_ids is None:
            raise ValueError("You have to specify input_ids")

        input_shape = input_ids.size()
        input_ids = input_ids.view(-1, input_shape[-1])

        hidden_states = self.embeddings(input_ids=input_ids, position_ids=position_ids)

        # note: Siglip2's text model does not use a causal mask, unlike the original CLIP model.
        # expand attention_mask
        if attention_mask is not None and not self._use_flash_attention_2:
            # [batch_size, seq_len] -> [batch_size, 1, tgt_seq_len, src_seq_len]
            attention_mask = _prepare_4d_attention_mask(attention_mask, hidden_states.dtype)

        encoder_outputs = self.encoder(
            inputs_embeds=hidden_states,
            attention_mask=attention_mask,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        last_hidden_state = encoder_outputs.last_hidden_state
        last_hidden_state = self.final_layer_norm(last_hidden_state)

        # Assuming "sticky" EOS tokenization, the last token is always EOS.
        pooled_output = last_hidden_state[:, -1, :]
        pooled_output = self.head(pooled_output)

        return BaseModelOutputWithPooling(
            last_hidden_state=last_hidden_state,
            pooler_output=pooled_output,
            hidden_states=encoder_outputs.hidden_states,
            attentions=encoder_outputs.attentions,
        )


@auto_docstring
class Siglip2PreTrainedModel(PreTrainedModel):
    config: Siglip2Config
    base_model_prefix = "siglip2"
    supports_gradient_checkpointing = True

    _no_split_modules = [
        "Siglip2TextEmbeddings",
        "Siglip2VisionEmbeddings",
        "Siglip2EncoderLayer",
        "Siglip2MultiheadAttentionPoolingHead",
    ]
    _supports_flash_attn = True
    _supports_sdpa = True
    _supports_flex_attn = True
    _supports_attention_backend = True

    def _init_weights(self, module):
        """Initialize the weights"""
        if isinstance(module, Siglip2VisionEmbeddings):
            width = (
                self.config.vision_config.hidden_size
                if isinstance(self.config, Siglip2Config)
                else self.config.hidden_size
            )
            nn.init.normal_(module.position_embedding.weight, std=1 / np.sqrt(width))
        elif isinstance(module, nn.Embedding):
            default_flax_embed_init(module.weight)
        elif isinstance(module, Siglip2Attention):
            nn.init.xavier_uniform_(module.q_proj.weight)
            nn.init.xavier_uniform_(module.k_proj.weight)
            nn.init.xavier_uniform_(module.v_proj.weight)
            nn.init.xavier_uniform_(module.out_proj.weight)
            nn.init.zeros_(module.q_proj.bias)
            nn.init.zeros_(module.k_proj.bias)
            nn.init.zeros_(module.v_proj.bias)
            nn.init.zeros_(module.out_proj.bias)
        elif isinstance(module, Siglip2MLP):
            nn.init.xavier_uniform_(module.fc1.weight)
            nn.init.xavier_uniform_(module.fc2.weight)
            nn.init.normal_(module.fc1.bias, std=1e-6)
            nn.init.normal_(module.fc2.bias, std=1e-6)
        elif isinstance(module, Siglip2MultiheadAttentionPoolingHead):
            nn.init.xavier_uniform_(module.probe.data)
            nn.init.xavier_uniform_(module.attention.in_proj_weight.data)
            nn.init.zeros_(module.attention.in_proj_bias.data)
        elif isinstance(module, Siglip2Model):
            logit_scale_init = torch.log(torch.tensor(1.0))
            module.logit_scale.data.fill_(logit_scale_init)
            module.logit_bias.data.zero_()
        elif isinstance(module, Siglip2ForImageClassification):
            nn.init.normal_(
                module.classifier.weight,
                std=self.config.vision_config.hidden_size**-0.5 * self.config.initializer_factor,
            )
        elif isinstance(module, (nn.Linear, nn.Conv2d)):
            lecun_normal_(module.weight)
            if module.bias is not None:
                nn.init.zeros_(module.bias)
        elif isinstance(module, nn.LayerNorm):
            module.bias.data.zero_()
            module.weight.data.fill_(1.0)


@auto_docstring(
    custom_intro="""
    The text model from Siglip2 without any head or projection on top.
    """
)
class Siglip2TextModel(Siglip2PreTrainedModel):
    config: Siglip2TextConfig

    def __init__(self, config: Siglip2TextConfig):
        super().__init__(config)
        self.text_model = Siglip2TextTransformer(config)
        # Initialize weights and apply final processing
        self.post_init()

    def get_input_embeddings(self) -> nn.Module:
        return self.text_model.embeddings.token_embedding

    def set_input_embeddings(self, value):
        self.text_model.embeddings.token_embedding = value

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.Tensor] = None,
        attention_mask: Optional[torch.Tensor] = None,
        position_ids: Optional[torch.Tensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> BaseModelOutputWithPooling:
        r"""
        Examples:

        ```python
        >>> from transformers import AutoTokenizer, Siglip2TextModel

        >>> model = Siglip2TextModel.from_pretrained("google/siglip2-base-patch16-224")
        >>> tokenizer = AutoTokenizer.from_pretrained("google/siglip2-base-patch16-224")

        >>> # important: make sure to set padding="max_length" as that's how the model was trained
        >>> inputs = tokenizer(["a photo of a cat", "a photo of a dog"], padding="max_length", return_tensors="pt")

        >>> outputs = model(**inputs)
        >>> last_hidden_state = outputs.last_hidden_state
        >>> pooled_output = outputs.pooler_output  # pooled (EOS token) states
        ```"""
        return self.text_model(
            input_ids=input_ids,
            attention_mask=attention_mask,
            position_ids=position_ids,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )


class Siglip2MultiheadAttentionPoolingHead(nn.Module):
    """Multihead Attention Pooling."""

    def __init__(self, config: Siglip2VisionConfig):
        super().__init__()

        self.probe = nn.Parameter(torch.randn(1, 1, config.hidden_size))
        self.attention = torch.nn.MultiheadAttention(config.hidden_size, config.num_attention_heads, batch_first=True)
        self.layernorm = nn.LayerNorm(config.hidden_size, eps=config.layer_norm_eps)
        self.mlp = Siglip2MLP(config)
        self.num_heads = config.num_attention_heads

    def forward(self, hidden_state: torch.Tensor, attention_mask: Optional[torch.Tensor] = None) -> torch.Tensor:
        batch_size = hidden_state.shape[0]
        probe = self.probe.repeat(batch_size, 1, 1)

        if attention_mask is not None:
            target_len, source_len = probe.shape[1], hidden_state.shape[1]
            attention_mask = _prepare_4d_attention_mask(attention_mask, hidden_state.dtype, target_len)
            attention_mask = attention_mask.repeat(1, self.num_heads, target_len, 1)
            attention_mask = attention_mask.reshape(-1, target_len, source_len)

        hidden_state = self.attention(probe, hidden_state, hidden_state, attn_mask=attention_mask)[0]

        residual = hidden_state
        hidden_state = self.layernorm(hidden_state)
        hidden_state = residual + self.mlp(hidden_state)

        return hidden_state[:, 0]


@auto_docstring(
    custom_intro="""
    The vision model from Siglip2 without any head or projection on top.
    """
)
class Siglip2VisionModel(Siglip2PreTrainedModel):
    config: Siglip2VisionConfig
    main_input_name = "pixel_values"

    def __init__(self, config: Siglip2VisionConfig):
        super().__init__(config)

        self.vision_model = Siglip2VisionTransformer(config)

        # Initialize weights and apply final processing
        self.post_init()

    def get_input_embeddings(self) -> nn.Module:
        return self.vision_model.embeddings.patch_embedding

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        pixel_values: torch.FloatTensor,
        pixel_attention_mask: torch.Tensor,
        spatial_shapes: torch.LongTensor,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> BaseModelOutputWithPooling:
        r"""
        pixel_attention_mask (`torch.Tensor` of shape `(batch_size, image_size, image_size)`, *optional*):
            Mask to avoid performing attention on padding pixel indices.
        spatial_shapes (`torch.LongTensor` of shape `(batch_size, 2)`):
            Tensor containing the spatial dimensions (height, width) of the input images.

        Examples:

        ```python
        >>> from PIL import Image
        >>> import requests
        >>> from transformers import AutoProcessor, Siglip2VisionModel

        >>> model = Siglip2VisionModel.from_pretrained("google/siglip2-base-patch16-224")
        >>> processor = AutoProcessor.from_pretrained("google/siglip2-base-patch16-224")

        >>> url = "http://images.cocodataset.org/val2017/000000039769.jpg"
        >>> image = Image.open(requests.get(url, stream=True).raw)

        >>> inputs = processor(images=image, return_tensors="pt")

        >>> outputs = model(**inputs)
        >>> last_hidden_state = outputs.last_hidden_state
        >>> pooled_output = outputs.pooler_output  # pooled features
        ```"""
        return self.vision_model(
            pixel_values=pixel_values,
            attention_mask=pixel_attention_mask,
            spatial_shapes=spatial_shapes,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )


@auto_docstring
class Siglip2Model(Siglip2PreTrainedModel):
    config: Siglip2Config

    def __init__(self, config: Siglip2Config):
        super().__init__(config)

        if not isinstance(config.text_config, Siglip2TextConfig):
            raise TypeError(
                "config.text_config is expected to be of type Siglip2TextConfig but is of type"
                f" {type(config.text_config)}."
            )

        if not isinstance(config.vision_config, Siglip2VisionConfig):
            raise TypeError(
                "config.vision_config is expected to be of type Siglip2VisionConfig but is of type"
                f" {type(config.vision_config)}."
            )

        text_config = config.text_config
        vision_config = config.vision_config

        # First, initialize the text and vision models with the proper attention implementation
        text_model = Siglip2TextModel._from_config(text_config)
        vision_model = Siglip2VisionModel._from_config(vision_config)

        self.text_model = text_model.text_model
        self.vision_model = vision_model.vision_model

        self.logit_scale = nn.Parameter(torch.randn(1))
        self.logit_bias = nn.Parameter(torch.randn(1))

        # Initialize weights and apply final processing
        self.post_init()

    def get_text_features(
        self,
        input_ids: Optional[torch.Tensor] = None,
        attention_mask: Optional[torch.Tensor] = None,
        position_ids: Optional[torch.Tensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> torch.FloatTensor:
        r"""
        Returns:
            text_features (`torch.FloatTensor` of shape `(batch_size, output_dim)`): The text embeddings obtained by
            applying the projection layer to the pooled output of [`Siglip2TextModel`].

        Examples:

        ```python
        >>> from transformers import AutoTokenizer, AutoModel
        >>> import torch

        >>> model = AutoModel.from_pretrained("google/siglip2-base-patch16-224")
        >>> tokenizer = AutoTokenizer.from_pretrained("google/siglip2-base-patch16-224")

        >>> # important: make sure to set padding="max_length" as that's how the model was trained
        >>> inputs = tokenizer(["a photo of a cat", "a photo of a dog"], padding="max_length", return_tensors="pt")
        >>> with torch.no_grad():
        ...     text_features = model.get_text_features(**inputs)
        ```"""
        # Use Siglip2Model's config for some fields (if specified) instead of those of the vision & text components.
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        text_outputs: BaseModelOutputWithPooling = self.text_model(
            input_ids=input_ids,
            attention_mask=attention_mask,
            position_ids=position_ids,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        pooled_output = text_outputs.pooler_output

        return pooled_output

    def get_image_features(
        self,
        pixel_values: Optional[torch.FloatTensor] = None,
        pixel_attention_mask: Optional[torch.Tensor] = None,
        spatial_shapes: Optional[torch.LongTensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> torch.FloatTensor:
        r"""
        pixel_attention_mask (`torch.Tensor` of shape `(batch_size, image_size, image_size)`, *optional*):
            Mask to avoid performing attention on padding pixel indices.
        spatial_shapes (`torch.LongTensor` of shape `(batch_size, 2)`):
            Tensor containing the spatial dimensions (height, width) of the input images.

        Returns:
            image_features (`torch.FloatTensor` of shape `(batch_size, output_dim)`): The image embeddings obtained by
            applying the projection layer to the pooled output of [`Siglip2VisionModel`].

        Examples:

        ```python
        >>> from PIL import Image
        >>> import requests
        >>> from transformers import AutoProcessor, AutoModel
        >>> import torch

        >>> model = AutoModel.from_pretrained("google/siglip2-base-patch16-224")
        >>> processor = AutoProcessor.from_pretrained("google/siglip2-base-patch16-224")

        >>> url = "http://images.cocodataset.org/val2017/000000039769.jpg"
        >>> image = Image.open(requests.get(url, stream=True).raw)

        >>> inputs = processor(images=image, return_tensors="pt")

        >>> with torch.no_grad():
        ...     image_features = model.get_image_features(**inputs)
        ```"""
        # Use Siglip2Model's config for some fields (if specified) instead of those of the vision & text components.
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        vision_outputs: BaseModelOutputWithPooling = self.vision_model(
            pixel_values=pixel_values,
            attention_mask=pixel_attention_mask,
            spatial_shapes=spatial_shapes,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        pooled_output = vision_outputs.pooler_output

        return pooled_output

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        input_ids: Optional[torch.LongTensor] = None,
        pixel_values: Optional[torch.FloatTensor] = None,
        pixel_attention_mask: Optional[torch.Tensor] = None,
        spatial_shapes: Optional[torch.LongTensor] = None,
        attention_mask: Optional[torch.Tensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        return_loss: Optional[bool] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> Siglip2Output:
        r"""
        pixel_attention_mask (`torch.Tensor` of shape `(batch_size, image_size, image_size)`, *optional*):
            Mask to avoid performing attention on padding pixel indices.
        spatial_shapes (`torch.LongTensor` of shape `(batch_size, 2)`):
            Tensor containing the spatial dimensions (height, width) of the input images.
        return_loss (`bool`, *optional*):
            Whether or not to return the contrastive loss.

        Examples:

        ```python
        >>> from PIL import Image
        >>> import requests
        >>> from transformers import AutoProcessor, AutoModel
        >>> import torch

        >>> model = AutoModel.from_pretrained("google/siglip2-base-patch16-224")
        >>> processor = AutoProcessor.from_pretrained("google/siglip2-base-patch16-224")

        >>> url = "http://images.cocodataset.org/val2017/000000039769.jpg"
        >>> image = Image.open(requests.get(url, stream=True).raw)

        >>> texts = ["a photo of 2 cats", "a photo of 2 dogs"]
        >>> # important: we pass `padding=max_length` since the model was trained with this
        >>> inputs = processor(text=texts, images=image, padding="max_length", return_tensors="pt")

        >>> with torch.no_grad():
        ...     outputs = model(**inputs)

        >>> logits_per_image = outputs.logits_per_image
        >>> probs = torch.sigmoid(logits_per_image) # these are the probabilities
        >>> print(f"{probs[0][0]:.1%} that image 0 is '{texts[0]}'")
        31.9% that image 0 is 'a photo of 2 cats'
        ```"""
        # Use Siglip2Model's config for some fields (if specified) instead of those of the vision & text components.
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        vision_outputs: BaseModelOutputWithPooling = self.vision_model(
            pixel_values=pixel_values,
            attention_mask=pixel_attention_mask,
            spatial_shapes=spatial_shapes,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        text_outputs: BaseModelOutputWithPooling = self.text_model(
            input_ids=input_ids,
            attention_mask=attention_mask,
            position_ids=position_ids,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        image_embeds = vision_outputs.pooler_output
        text_embeds = text_outputs.pooler_output

        # normalized features
        image_embeds = image_embeds / image_embeds.norm(p=2, dim=-1, keepdim=True)
        text_embeds = text_embeds / text_embeds.norm(p=2, dim=-1, keepdim=True)

        # cosine similarity as logits
        logits_per_text = torch.matmul(text_embeds, image_embeds.t().to(text_embeds.device))

        logit_scale, logit_bias = self.logit_scale.to(text_embeds.device), self.logit_bias.to(text_embeds.device)
        logits_per_text = logits_per_text * logit_scale.exp() + logit_bias

        logits_per_image = logits_per_text.t()

        loss = None
        if return_loss:
            # Sigmoid (pairwise) contrastive loss: targets are +1 on the diagonal and -1 elsewhere
            eye = torch.eye(logits_per_text.size(0), device=logits_per_text.device)
            m1_diag1 = -torch.ones_like(logits_per_text) + 2 * eye
            loglik = torch.nn.functional.logsigmoid(m1_diag1 * logits_per_text)
            nll = -torch.sum(loglik, dim=-1)
            loss = nll.mean()

        return Siglip2Output(
            loss=loss,
            logits_per_image=logits_per_image,
            logits_per_text=logits_per_text,
            text_embeds=text_embeds,
            image_embeds=image_embeds,
            text_model_output=text_outputs,
            vision_model_output=vision_outputs,
        )


@auto_docstring(
    custom_intro="""
    Siglip2 vision encoder with an image classification head on top (a linear layer on top of the pooled final hidden states of
    the patch tokens) e.g. for ImageNet.
    """
)
class Siglip2ForImageClassification(Siglip2PreTrainedModel):
    main_input_name = "pixel_values"

    def __init__(self, config: Siglip2Config) -> None:
        super().__init__(config)

        self.num_labels = config.num_labels

        # Create the vision tower and keep only the inner Siglip2VisionTransformer submodule
        vision_model = Siglip2VisionModel._from_config(config.vision_config)
        self.vision_model = vision_model.vision_model

        # Classifier head
        self.classifier = (
            nn.Linear(config.vision_config.hidden_size, config.num_labels) if config.num_labels > 0 else nn.Identity()
        )

        # Initialize weights and apply final processing
        self.post_init()

    @can_return_tuple
    @auto_docstring
    def forward(
        self,
        pixel_values: Optional[torch.Tensor] = None,
        pixel_attention_mask: Optional[torch.Tensor] = None,
        spatial_shapes: Optional[torch.LongTensor] = None,
        labels: Optional[torch.Tensor] = None,
        output_attentions: Optional[bool] = None,
        output_hidden_states: Optional[bool] = None,
    ) -> ImageClassifierOutput:
        r"""
        pixel_attention_mask (`torch.Tensor` of shape `(batch_size, image_size, image_size)`, *optional*):
            Mask to avoid performing attention on padding pixel indices.
        spatial_shapes (`torch.LongTensor` of shape `(batch_size, 2)`):
            Tensor containing the spatial dimensions (height, width) of the input images.
        labels (`torch.LongTensor` of shape `(batch_size,)`, *optional*):
            Labels for computing the image classification/regression loss. Indices should be in `[0, ...,
            config.num_labels - 1]`. If `config.num_labels == 1` a regression loss is computed (Mean-Square loss), If
            `config.num_labels > 1` a classification loss is computed (Cross-Entropy).

        Examples:

        ```python
        >>> from transformers import AutoImageProcessor, Siglip2ForImageClassification
        >>> import torch
        >>> from PIL import Image
        >>> import requests

        >>> torch.manual_seed(3)  # doctest: +IGNORE_RESULT
        >>> url = "http://images.cocodataset.org/val2017/000000039769.jpg"
        >>> image = Image.open(requests.get(url, stream=True).raw)

        >>> # note: we are loading a `Siglip2Model` from the hub here,
        >>> # so the head will be randomly initialized, hence the predictions will be random if seed is not set above.
        >>> image_processor = AutoImageProcessor.from_pretrained("google/siglip2-base-patch16-224")
        >>> model = Siglip2ForImageClassification.from_pretrained("google/siglip2-base-patch16-224")

        >>> inputs = image_processor(images=image, return_tensors="pt")
        >>> outputs = model(**inputs)
        >>> logits = outputs.logits
        >>> # model predicts one of the two classes
        >>> predicted_class_idx = logits.argmax(-1).item()
        >>> print("Predicted class:", model.config.id2label[predicted_class_idx])
        Predicted class: LABEL_1
        ```"""
        output_attentions = output_attentions if output_attentions is not None else self.config.output_attentions
        output_hidden_states = (
            output_hidden_states if output_hidden_states is not None else self.config.output_hidden_states
        )

        outputs: BaseModelOutputWithPooling = self.vision_model(
            pixel_values,
            attention_mask=pixel_attention_mask,
            spatial_shapes=spatial_shapes,
            output_attentions=output_attentions,
            output_hidden_states=output_hidden_states,
        )

        sequence_output = outputs.last_hidden_state

        # average pool the patch tokens
        if pixel_attention_mask is not None:
            pool_mask = pixel_attention_mask[..., None].to(sequence_output.device)
            sequence_output = torch.sum(sequence_output * pool_mask, dim=1) / torch.sum(pool_mask, dim=1)
        else:
            sequence_output = torch.mean(sequence_output, dim=1)

        # apply classifier
        logits = self.classifier(sequence_output)

        loss = None
        if labels is not None:
            # move labels to correct device to enable model parallelism
            labels = labels.to(logits.device)
            if self.config.problem_type is None:
                if self.num_labels == 1:
                    self.config.problem_type = "regression"
                elif self.num_labels > 1 and (labels.dtype == torch.long or labels.dtype == torch.int):
                    self.config.problem_type = "single_label_classification"
                else:
                    self.config.problem_type = "multi_label_classification"

            if self.config.problem_type == "regression":
                loss_fct = MSELoss()
                if self.num_labels == 1:
                    loss = loss_fct(logits.squeeze(), labels.squeeze())
                else:
                    loss = loss_fct(logits, labels)
            elif self.config.problem_type == "single_label_classification":
                loss_fct = CrossEntropyLoss()
                loss = loss_fct(logits.view(-1, self.num_labels), labels.view(-1))
            elif self.config.problem_type == "multi_label_classification":
                loss_fct = BCEWithLogitsLoss()
                loss = loss_fct(logits, labels)

        return ImageClassifierOutput(
            loss=loss,
            logits=logits,
            hidden_states=outputs.hidden_states,
            attentions=outputs.attentions,
        )


__all__ = [
    "Siglip2Model",
    "Siglip2PreTrainedModel",
    "Siglip2TextModel",
    "Siglip2VisionModel",
    "Siglip2ForImageClassification",
]
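
# ---------------------------------------------------------------------------
# Illustrative usage sketch (not part of the upstream transformers module).
# It mirrors the doctest examples above and assumes the
# `google/siglip2-base-patch16-224` checkpoint is reachable and that Pillow and
# requests are installed. The processor flattens each image into patches and
# returns `pixel_values`, `pixel_attention_mask` and `spatial_shapes`, which
# Siglip2Model consumes for zero-shot image-text matching.
if __name__ == "__main__":
    import requests
    from PIL import Image

    from transformers import AutoModel, AutoProcessor

    checkpoint = "google/siglip2-base-patch16-224"
    model = AutoModel.from_pretrained(checkpoint)
    processor = AutoProcessor.from_pretrained(checkpoint)

    image = Image.open(
        requests.get("http://images.cocodataset.org/val2017/000000039769.jpg", stream=True).raw
    )
    texts = ["a photo of 2 cats", "a photo of 2 dogs"]

    # padding="max_length" matches how the text tower was trained (see docstrings above)
    inputs = processor(text=texts, images=image, padding="max_length", return_tensors="pt")

    with torch.no_grad():
        outputs = model(**inputs)

    # Sigmoid (not softmax) turns the pairwise logits into independent match probabilities
    probs = torch.sigmoid(outputs.logits_per_image)
    for text, prob in zip(texts, probs[0].tolist()):
        print(f"{prob:.1%} that the image matches '{text}'")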