
    <h                        S r SSKrSSKJrJrJr  SSKrSSKJs  J	r
  SSKJr  SSKJr  SSKJr  SSKJr  SS	KJr  SS
KJr  SSKJrJr  SSKJr  SSKJr  SSKJr  SSKJrJ r   SSK!J"r"  SSK#J$r$J%r%J&r&J'r'J(r(J)r)J*r*J+r+  SSK,J-r-J.r.  \ " 5       (       a  SSK/J0r0   " S S\5      r1 " S S\'5      r2 " S S\(5      r3   S=S\Rh                  S\Rj                  S\Rj                  S\Rj                  S\\Rj                  S 4   S!\\6   S"\\6   S#\\Rj                     S$\7\Rj                  \Rj                  4   4S% jjr8\" 5       r9\8\9S&'    " S' S(\Rh                  5      r: " S) S*\%5      r; " S+ S,\Rh                  5      r< " S- S.\5      r= " S/ S0\&5      r> " S1 S2\.5      r?    S>S3\\Rj                  \7\Rj                     S4   S4\\@   S5\\@   S6\@S\\Rj                     S$\\Rj                  \@4   4S7 jjrA " S8 S9\-5      rB " S: S;\$5      rC/ S<QrDg)?zPyTorch Doge model.    N)CallableOptionalUnion)nn   )ACT2FN)Cache)PretrainedConfig)compile_friendly_flex_attention)GradientCheckpointingLayer)MoeCausalLMOutputWithPastMoeModelOutputWithPast)rope_config_validation)AttentionInterface)Unpack)TransformersKwargsis_torch_flex_attn_available)OutputRecorder   )LlamaForSequenceClassificationLlamaMLPLlamaPreTrainedModelLlamaRMSNormLlamaRotaryEmbeddingapply_rotary_pos_embeager_attention_forward	repeat_kv)MixtralForCausalLMMixtralModel)	BlockMaskc                      ^  \ rS rSrSrSrS/r0 SS_SS_SS_S	S
_SS
_SS_SS_SS_SS_SS_SS_SS_SS
_SS_SS_SS_rS/S/4SS/S/4S/S/4S.r                          S!U 4S jjr	S r
U =r$ )"
DogeConfig6   a0  
This is the configuration class to store the configuration of a [`DogeModel`]. It is used to instantiate a Doge
model according to the specified arguments, defining the model architecture like [SmallDoge/Doge-320M](https://huggingface.co/SmallDoge/Doge-320M).

Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
documentation from [`PretrainedConfig`] for more information.

Args:
    vocab_size (`int`, *optional*, defaults to 32768):
        Vocabulary size of the Doge2 model. Defines the number of different tokens that can be represented by the `input_ids` passed when calling [`DogeModel`]
    hidden_size (`int`, *optional*, defaults to 1024):
        Dimension of the hidden representations.
    intermediate_size (`int`, *optional*, defaults to 2048):
        Dimension of the MLP representations.
    num_hidden_layers (`int`, *optional*, defaults to 32):
        Number of hidden layers in the Transformer decoder.
    hidden_dropout (`float`, *optional*, defaults to 0.0):
        Dropout probability for each sequence transformation and state transformation module.
    hidden_act (`str` or `function`, *optional*, defaults to `"silu"`):
        The non-linear activation function (function or string) in the decoder.
    initializer_range (`float`, *optional*, defaults to 0.02):
        The standard deviation of the truncated_normal_initializer for initializing all weight matrices.
    rms_norm_eps (`float`, *optional*, defaults to 1e-06):
        The epsilon used by the rms normalization layers.
    use_cache (`bool`, *optional*, defaults to `True`):
        Whether or not the model should return the last key/values attentions (not used by all models). Only
        relevant if `config.is_decoder=True`.
    tie_word_embeddings (`bool`, *optional*, defaults to `False`):
        Whether the model's input and output word embeddings should be tied.
    max_position_embeddings (`int`, *optional*, defaults to 2048):
        The maximum sequence length that this model might ever be used with.
    rope_theta (`float`, *optional*, defaults to 10000.0):
        The base period of the RoPE embeddings.
    rope_scaling (`Dict`, *optional*):
        Dictionary containing the scaling configuration for the RoPE embeddings.
        NOTE: if you apply a new rope type and expect the model to work on a longer `max_position_embeddings`, we recommend updating this value accordingly.
        Doge family of small models use `{ 'rope_type': 'dynamic', 'factor': 4.0, 'original_max_position_embeddings': 2048 }` as the default value.
        Expected contents:
            `rope_type` (`str`):
                The sub-variant of RoPE to use. Can be one of ['default', 'linear', 'dynamic', 'yarn', 'longrope', 'llama3'], with 'default' being the original RoPE implementation.
            `factor` (`float`, *optional*):
                Used with all rope types except 'default'. The scaling factor to apply to the RoPE embeddings.
                In most scaling types, a `factor` of x will enable the model to handle sequences of length x * original maximum pre-trained length.
            `original_max_position_embeddings` (`int`, *optional*):
                Used with 'dynamic', 'longrope' and 'llama3'.
                The original max position embeddings used during pretraining.
            `attention_factor` (`float`, *optional*):
                Used with 'yarn' and 'longrope'. The scaling factor to be applied on the attention
                computation.
                If unspecified, it defaults to value recommended by the implementation, using the `factor` field to infer the suggested value.
            `beta_fast` (`float`, *optional*):
                Only used with 'yarn'. Parameter to set the boundary for extrapolation (only) in the linear
                ramp function. If unspecified, it defaults to 32.
            `beta_slow` (`float`, *optional*):
                Only used with 'yarn'. Parameter to set the boundary for interpolation (only) in the linear
                ramp function. If unspecified, it defaults to 1.
            `short_factor` (`List[float]`, *optional*):
                Only used with 'longrope'. The scaling factor to be applied to short contexts (<`original_max_position_embeddings`).
                Must be a list of numbers with the same length as the hidden size divided by the number of attention heads divided by 2
            `long_factor` (`List[float]`, *optional*):
                Only used with 'longrope'. The scaling factor to be applied to long contexts (>`original_max_position_embeddings`).
                Must be a list of numbers with the same length as the hidden size divided by the number of attention heads divided by 2
            `low_freq_factor` (`float`, *optional*):
                Only used with 'llama3'. Scaling factor applied to low frequency components of the RoPE
            `high_freq_factor` (`float`, *optional*):
                Only used with 'llama3'. Scaling factor applied to high frequency components of the RoPE
    num_attention_heads (`int`, *optional*, defaults to 8):
        Number of attention heads for each attention layer in the Transformer decoder.
    num_key_value_heads (`int`, *optional*):
        This is the number of key_value heads that should be used to implement Grouped Query Attention.
        If `num_key_value_heads=num_attention_heads`, the model will use Multi Head Attention (MHA), if
        `num_key_value_heads=1` the model will use Multi Query Attention (MQA) otherwise GQA is used.
        When converting a multi-head checkpoint to a GQA checkpoint, each group key and value head should be constructed by meanpooling all the original heads within that group.
        For more details checkout [this paper](https://arxiv.org/pdf/2305.13245.pdf).
        If it is not specified, will default to `num_attention_heads`.
    attention_bias (`bool`, *optional*, defaults to `False`):
        Whether to use a bias in the query, key, value and output projection layers during self-attention.
    attention_dropout (`float`, *optional*, defaults to 0.0):
        The dropout ratio for the attention probabilities.
    mlp_bias (`bool`, *optional*, defaults to `False`):
        Whether to use a bias in up_proj, down_proj and gate_proj layers in the MLP layers.
    sliding_window (`int`, *optional*):
        Sliding window attention window size. If not specified, will default to `None`.
    keep_window_size (`int`, *optional*, defaults to 2048):
        The window size of tokens that are not dynamically masked, and dynamic masking is only performed when the sequence length exceeds this value.
    is_moe (`bool`, *optional*, defaults to `False`):
        Whether to use the Cross Domain Mixture of Experts; if `True`, the MoE will inherit the MLP to initialize.
    num_experts (`int`, *optional*, defaults to 16384):
        Number of routed experts in the model. This is only used when `is_moe=True`.
    num_experts_per_tok (`int`, *optional*, defaults to 64):
        Number of selected experts to route per-token.
    norm_topk_prob (`bool`, *optional*, defaults to `False`):
        Whether to normalize the topk probabilities.
    output_router_logits (`bool`, *optional*, defaults to `False`):
        Whether or not the router logits should be returned by the model. Enabling this will also
        allow the model to output the auxiliary loss, including load balancing loss and router z-loss.
    router_aux_loss_coef (`float`, *optional*, defaults to 0.001):
        The aux loss factor for the total loss.

```python
>>> from transformers import DogeConfig, DogeModel

>>> # Initializing a Doge-320M style configuration
>>> configuration = DogeConfig()

>>> # Initializing a model from the Doge-320M style configuration
>>> model = DogeModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```dogepast_key_valueszlayers.*.self_attn.q_projcolwisezlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.dt_projrowwisezlayers.*.self_attn.o_projzlayers.*.input_layernorm.weightsequence_parallelzlayers.*.input_residual.weightz(layers.*.post_attention_layernorm.weightz'layers.*.post_attention_residual.weightznorm.weightzlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_projzlayers.*.mlp.router_gatecolwise_repzlayers.*.mlp.down_embedrowwise_repzlayers.*.mlp.up_embed	input_idsinputs_embedshidden_statesattention_mask)embed_tokenslayersnormc                   > Xl         X l        X0l        X@l        XPl        X`l        Xpl        Xl        Xl        Xl	        Xl
        Xl        Xl        Xl        UU l        UU l        UU l        UU l        UU l        UU l        UU l        UU l        UU l        UU l        UU l        U R                  b,  SU R                  ;   a  U R                  S   U R                  S'   [3        U 5        Uc  Xl        [4        TU ]l  " SSU
0UD6  g )Ntype	rope_typetie_word_embeddings )
vocab_sizehidden_sizeintermediate_sizenum_hidden_layershidden_dropout
hidden_actinitializer_rangerms_norm_eps	use_cachemax_position_embeddings
rope_thetarope_scalingnum_attention_headsnum_key_value_headsattention_biasattention_dropoutmlp_biassliding_windowkeep_window_sizeis_moenum_expertsnum_experts_per_toknorm_topk_proboutput_router_logitsrouter_aux_loss_coefr   super__init__)selfr7   r8   r9   r:   r;   r<   r=   r>   r?   r5   r@   rA   rB   rC   rD   rE   rF   rG   rH   rI   rJ   rK   rL   rM   rN   rO   kwargs	__class__s                               ]/var/www/html/shao/venv/lib/python3.13/site-packages/transformers/models/doge/modular_doge.pyrQ   DogeConfig.__init__   s   < %&!2!2,$!2("'>$$(#6 #6 ,!2 , 0&#6 ,$8!$8! (Vt7H7H-H-1->->v-FDk*t$ &':$ 	
 3	
	
    )rE   rF   r<   r;   r8   r=   r9   rJ   rI   r@   rG   rM   rC   rK   rL   r:   rD   rN   r>   rB   rA   rO   rH   r?   r7   )i   i                  silug{Gz?gư>TFrX   g     @N   NFrZ   FNrX   Fi @  @   FFgMbP?)__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planrQ   __static_attributes____classcell__rT   s   @rU   r"   r"   6   su   n` J#4"5#Y#Y 	$Y 	%i	
 	$Y 	*+> 	)*= 	34G 	23F 	* 	!) 		 	!) 	#M 	"=  	 !& &(9:#%568IJ!"_$56 ! $ ""7G
 G
rW   r"   c                       \ rS rSrSrg)DogeRMSNormi  r6   Nr^   r_   r`   ra   rg   r6   rW   rU   rk   rk         rW   rk   c                       \ rS rSrSrg)DogeRotaryEmbeddingi  r6   Nrl   r6   rW   rU   ro   ro     rm   rW   ro   modulequerykeyvaluer.   r    scalingsoftcap	head_maskreturnc                 6  ^^^ S n	S m[        U[        5      (       a  Un	OUmTb  TS S 2S S 2S S 2S UR                  S   24   mUUU4S jn
[        UUUU
U	SUSS9u  pUR	                  UR
                  5      nUR                  SS5      R                  5       nX4$ )Nc                    > Tb  T[         R                  " U T-  5      -  n Tb  U TU   U   U   U   -   n Tb  U TU   U   S   S   -   n U $ )Nr   )torchtanh)score	batch_idxhead_idxq_idxkv_idxcausal_maskrv   ru   s        rU   	score_mod)flex_attention_forward.<locals>.score_mod)  sm    ejj99E"K	28<UCFKKE Ii0:1=a@@ErW   T)r   
block_mask
enable_gqascale
return_lse   r   )
isinstancer    shaper   todtype	transpose
contiguous)rp   rq   rr   rs   r.   rt   ru   rv   rS   r   r   attn_outputattention_weightsr   s         ``     @rU   flex_attention_forwardr     s     JK.),,#
$!!Q?SYYr]?":; &E &"K *,,U[[9''1-88:K))rW   doge_flex_attentionc                     ^  \ rS rSrSS\S\\   4U 4S jjjr   SS\R                  S\
\R                  \R                  4   S\\R                     S\\   S	\\R                     S
\
\R                  \\R                     \\
\R                        4   4S jjr  SS\R                  S\R                  S\S\\R                     4S jjrSrU =r$ )DogeAttentioniI  config	layer_idxc                   > [         TU ]  5         Xl        X l        [	        USUR
                  UR                  -  5      U l        UR                  UR                  -  U l	        U R                  S-  U l
        UR                  U l        UR                  U l        [        R                  " UR
                  UR                  U R                  -  UR                  S9U l        [        R                  " UR
                  UR                  U R                  -  UR                  S9U l        [        R                  " UR
                  UR                  U R                  -  UR                  S9U l        [        R&                  " [(        R*                  " UR                  5      5      U l        [        R                  " UR                  U R                  -  UR                  UR                  S9U l        [        R                  " UR                  U R                  -  UR
                  UR                  S9U l        [3        U R                  UR4                  S9U l        [3        U R                  UR4                  S9U l        g )Nhead_dimg      ࿩biaseps)rP   rQ   r   r   getattrr8   rC   r   rD   num_key_value_groupsrt   rF   rI   r   LinearrE   q_projk_projv_proj	Parameterr{   zerosAdt_projo_projrk   r>   q_normk_normrR   r   r   rT   s      rU   rQ   DogeAttention.__init__J  s   "
F4F4F&JdJd4de$*$>$>&B\B\$\!}}d*!'!9!9 & 7 7ii : :T]] JQWQfQf
 ii : :T]] JQWQfQf
 ii : :T]] JQWQfQf
 ekk&*D*DEFyy&&68R8RY_YnYn
 ii&&68J8JQWQfQf
 "$--V5H5HI!$--V5H5HIrW   r-   position_embeddingsr.   past_key_valuecache_positionrw   c                    UR                   S S n/ UQSPU R                  P7nU R                  U R                  U5      R	                  U5      5      R                  SS5      n	U R                  U R                  U5      R	                  U5      5      R                  SS5      n
U R                  U5      R	                  U5      R                  SS5      nUu  p[        XX5      u  pUb$  XUS.nUR                  XU R                  U5      u  pU R                  UR                  SS5      R                  UR                   S   UR                   S   S5      5      n[        R                  " U R                   ["        R$                  " U5      -  5      R                  SS5      nU R'                  UUU R(                  US9n[+        UU R,                  5      n[.        nU R0                  R2                  S:w  a  [4        U R0                  R2                     nU" U U	U
U4UU R6                  (       d  S	OU R8                  U R:                  S
.UD6u  nnUR                  " / UQSP76 R=                  5       nU R?                  U5      nUU4$ )Nr   r   )sincosr   r   ry   )r-   	dt_statesrI   r.   eagerrZ   )r.   dropoutrt   ) r   r   r   r   viewr   r   r   r   r   updater   r   reshaper{   expr   Fsoftplusprepare_dynamic_maskrI   r   r   r   r   _attn_implementationALL_ATTENTION_FUNCTIONStrainingrF   rt   r   r   )rR   r-   r   r.   r   r   rS   input_shapehidden_shapequery_states
key_statesvalue_statesr   r   cache_kwargsr   	attn_maskattention_interfacer   attn_weightss                       rU   forwardDogeAttention.forwardh  s^    $))#2.88b8$--8{{4;;}#=#B#B<#PQ[[\]_`a[[]!;!@!@!NOYYZ[]^_
{{=166|DNNqRST&#7RU#[ %#&nUL'5'<'<ZW[WeWegs't$J LL""1a(001C1CA1FHZHZ[]H^`bc
	 IIdffqzz)'<<=GGBO	--'!22)	 . 
	 i)B)BC	(?;;++w6"9$++:Z:Z"[$7		%

 %#}}C$2H2HLL	%
 	%
!\ "));;;;FFHkk+.L((rW   r   rI   c           	         [         R                  " UR                  5      R                  nUR                  nUSS2SS2SSS24   R	                  SSUR
                  S   S5      nUb  [        U[        5      (       d  UR                  [         R                  :X  aB  UR                  n[         R                  " U[         R                  " SUR                  US9U5      nUR                  USS2SS2SS2SUR
                  S   24   S:g  U5      nUR
                  S   U:  ah  [         R                  " XvUR                  S9n[         R                  " XsSSS	S
9R                  n	UR!                  SU	S5      nUR                  US:H  U5      nU$ )a  
The core idea of DMA is to compute a dynamic attention mask that determines which tokens to mask, so as to form sparse attention.

Combine `dt_states` with `attention_mask` to generate the final `attn_mask`.

Args:
    hidden_states (`torch.Tensor`): The input hidden_states, used to determine the minimum value of the current input precision.
    dt_states (`torch.Tensor`): dt_states of shape `(batch_size, num_heads, key_sequence_length)`.
    keep_window_size (`int`): The window size of tokens that are not dynamically masked, and dynamic masking is only performed when the sequence length exceeds this value.
    attention_mask (`torch.Tensor`, *optional*): attention mask of shape `(batch_size, 1, query_sequence_length, key_sequence_length)`.
Nr   r   rZ   )devicer   r   r   r   TF)dimlargestsorted      ?)r{   finfor   minexpandr   r   r    boolwheretensorr   masked_fill
zeros_liketopkindicesscatter)
rR   r-   r   rI   r.   	min_dtyper   r   active_masktopk_indicess
             rU   r   "DogeAttention.prepare_dynamic_mask  se   $ KK 3 3488	##aD!m,33M''*B
	 %j.S.S##uzz1%++!&"ELL^=R=RZ_$`bk" "--nQ1F[	XZH[F[=[.\`a.aclmI??2!11**9)JZJZ[K ::irSW`efnnL%--b,DK!--kS.@)LIrW   )r   rF   r   r   r   r   r   rI   r   r   r   r   r   rt   r   NNNN)rX   N)r^   r_   r`   ra   r"   r   intrQ   r{   Tensortupler	   
LongTensorr   r   rg   rh   ri   s   @rU   r   r   I  s   Jz Jhsm J JD 26*.596)||6) #5<<#=>6) !.	6)
 !6) !!1!126) 
u||Xell3XeELL>Q5RR	S6)x !%15#||# <<# 	#
 !.# #rW   r   c                       \ rS rSrSrg)DogeMLPi  r6   Nrl   r6   rW   rU   r   r     rm   rW   r   c                   j   ^  \ rS rSrS\4U 4S jjrS\R                  S\R                  4S jrSr	U =r
$ )	DogeCDMoEi  r   c                   > [         TU ]  5         UR                  U l        UR                  U l        [        UR
                     U l        UR                  U l        [        R                  " [        R                  " U R                  5      5      U l        UR                  U l        UR                  U l        [        R                   " U R                  U R                  UR"                  S9U l        [        R                   " U R                  U R                  UR"                  S9U l        [        R                   " U R                  U R                  UR"                  S9U l        [        R                   " U R                  U R                  S-  SS9U l        [        R,                  " U R                  U R                  5      U l        [        R,                  " U R                  U R                  5      U l        g )Nr   r   F)rP   rQ   r8   r9   r   r<   act_fnrK   mathfloorsqrtnum_keysrL   top_krM   r   r   rG   	gate_projup_proj	down_projrouter_gate	Embedding
down_embedup_embedrR   r   rT   s     rU   rQ   DogeCDMoE.__init__  s_   !--!'!9!9V../!--

499T-=-=#>?//
$33 4#3#3T5K5KRXRaRabyy!1!143I3IPVP_P_`4#9#94;K;KRXRaRab 99T%5%5t}}q7HuU ,,t'7'79I9IJT%5%5t7G7GHrW   r-   rw   c                    UR                   u  p4nU R                  U5      R                  SX4-  S5      nUR                  U R                  SS9u  u  pxu  pUR                  S5      UR                  S5      -   nU	R                  S5      U R                  -  U
R                  S5      -   nUR                  " / UR                   S S QSP76 nUR                  " / UR                   S S QSP76 nUR                  U R                  SS9u  pUR                  SU5      n[        R                  " USS9nU R                  (       a  UUR                  SSS9-  nU R                  U5      nU R                  U5      n[        R                  " UUR                  X4-  SS5      5      R                  X4-  S5      nU R!                  U5      U-  n[        R                  " UR                  X4-  SS5      U5      R                  X4S5      nU R#                  U R!                  U R%                  U5      5      U R'                  U5      -  5      nUU-   nX4$ )Nr   r   r   ry   T)r   keepdimr   )r   r   r   r   r   	unsqueezer   gatherr   softmaxrM   sumr   r   r{   matmulr   r   r   r   )rR   r-   rS   bszseq_len_router_logitsscores_xscores_y	indices_x	indices_y
all_scoresall_indicesscoresposition_indicesr   routing_weightsr   r   experts_weightsexperts_statess                        rU   r   DogeCDMoE.forward  s+   
 (--a ((7<<QrR 8E7I7I$--]_7I7`44y''+h.@.@.DD
))"-=	@S@STV@WW__@j&6&6s&;@R@
!&&C(9(9#2(>CC#-??4::2?#F $$R)9:))F322r42HHO __W-
==),,z=3E3EcmUWYZ3[\aabeboqst++o6Ho&:&:3=!R&PRZ[``adoqrt{{4>>-3P'QTXT`T`anTo'op%6++rW   )r   r   r   r   r8   r9   rM   rK   r   r   r   r   r   )r^   r_   r`   ra   r"   rQ   r{   r   r   rg   rh   ri   s   @rU   r   r     s5    Iz I.,||, 
	, ,rW   r   c                     ^  \ rS rSrSS\S\\   4U 4S jjjr     SS\R                  S\
\R                  \R                  4   S\\R                     S\\R                     S	\\
\R                        S
\\   S\\R                     S\\   S\
\R                  \\
\R                  \R                  4      4   4S jjrSrU =r$ )DogeDecoderLayeri  r   r   c                 (  > [         TU ]  5         UR                  U l        [        UR                  UR
                  S9U l        [        XS9U l        [        R                  " [        R                  " UR                  5      5      U l        [        UR                  UR
                  S9U l        UR                  (       d  [!        U5      O
[#        U5      U l        [        R                  " [        R                  " UR                  5      5      U l        g )Nr   )r   r   )rP   rQ   r;   rk   r8   r>   input_layernormr   	self_attnr   r   r{   onesinput_residualpost_attention_layernormrJ   r   r   mlppost_attention_residualr   s      rU   rQ   DogeDecoderLayer.__init__  s    $33*6+=+=6CVCVW&fJ ll5::f6H6H+IJ(3F4F4FFL_L_(`%*0--76?Yv=N')||EJJv?Q?Q4R'S$rW   r-   r   r.   position_idsr   r?   r   rS   rw   c                    Un	U R                  U5      nU R                  " SUUUUUUUS.UD6u  p[        R                  " XR                  U R
                  S9nU R                  U	-  U-   nUn	U R                  U5      nU R                  U5      n[        R                  " XR                  U R
                  S9nU R                  U	-  U-   nU$ )N)r-   r   r.   r  r   r?   r   )pr   r6   )
r  r  r   r   r;   r   r  r  r  r  )rR   r-   r   r.   r  r   r?   r   rS   residualself_attn_weightss              rU   r   DogeDecoderLayer.forward  s     !,,];+/>> 	,
' 3)%))	,
 	,
( 		-3F3FQUQ^Q^_++h6F !55mD/		-3F3FQUQ^Q^_44x?-OrW   )r;   r  r  r  r  r  r  r   )NNNFN)r^   r_   r`   ra   r"   r   r   rQ   r{   r   r   r   r   r   r   FloatTensorr   rg   rh   ri   s   @rU   r  r    s   
Tz 
Thsm 
T 
T  26378<$)59"||" #5<<#=>" !.	"
 u//0" !u||!45" D>" !!1!12" +," 
u  (51B1BEDUDU1U+V"WW	X" "rW   r  c                   8    \ rS rSrSrSr\" \SS9\\	S.r
S rSrg)	DogePreTrainedModeli5  Fr   )index)r  r-   
attentionsc                    [         R                  " U5        [        U[        5      (       a7  [	        US5      (       a%  UR
                  R                  R                  5         gg[        U[        5      (       an  [	        US5      (       a%  UR                  R                  R                  S5        [	        US5      (       a&  UR                  R                  R                  S5        ggg)zInitialize the weightsr   r  r   r  N)r   _init_weightsr   r   hasattrr   datazero_r  r  fill_r  )rR   rp   s     rU   r+  !DogePreTrainedModel._init_weights>  s    **62fm,,vs####% $ 011v/00%%**005v899..3399#> : 2rW   r6   N)r^   r_   r`   ra   _supports_flash_attn_can_compile_fullgraphr   r   r  r   _can_record_outputsr+  rg   r6   rW   rU   r'  r'  5  s+     "'	;)#
?rW   r'  c                       \ rS rSrSrg)	DogeModeliK  r6   Nrl   r6   rW   rU   r5  r5  K  rm   rW   r5  gate_logitsrK   r   r   c                    U b  [        U [        5      (       d  gU S   R                  nU S   R                  n/ n/ nU  GH  n	U	R	                  U5      n	U	R                  USS9u  u  pu  pU
R                  S5      UR                  S5      -   nUR                  S5      U-  UR                  S5      -   nUR                  " / UR                  SS QSP76 nUR                  " / UR                  SS QSP76 nUR                  USS9u  nnUR                  SU5      n[        R                  " USS9nUR                  U5        UR                  U5        GM     [        R                  " USS9n[        R                  " USS9nUcu  UR                  S5      n[        R                  " XUS9n[        R                   " XuUS9nUR#                  SUU5      UR                  S   -  n[        R$                  " USS9nGO;UR                  u  nn['        U 5      nUSSS2SS2S4   R)                  UUUU45      R+                  S5      R	                  U5      nUR                  S5      UR-                  5          n[        R                  " XUS9n[        R                   " XuUS9nUR#                  SUU5      [        R.                  " U5      -  nUSSS2SS2S4   R)                  UUUU45      R+                  SU5      R	                  U5      n[        R.                  " UU-  SS9[        R.                  " USS9-  n[        R.                  " UU-  5      nUU-  $ )a  
Computes auxiliary load balancing loss as in Switch Transformer - implemented in Pytorch.

See Switch Transformer (https://arxiv.org/abs/2101.03961) for more details. This function implements the loss
function presented in equations (4) - (6) of the paper. It aims at penalizing cases where the routing between
experts is too unbalanced.

Args:
    gate_logits:
        Logits from the `router_gate`, should be a tuple of model.config.num_hidden_layers tensors of
        shape [2, batch_size * sequence_length, num_keys].
    num_experts:
        Number of experts
    num_keys:
        Number of keys
    top_k:
        The number of experts to route per-token, can be also interpreted as the `top-k` routing
        parameter.
    attention_mask (`torch.Tensor`, *optional*):
        The attention_mask used in forward function
        shape [batch_size X sequence_length] if not None.

Returns:
    The auxiliary loss.
Nr   r   r   ry   r   )r   r   r   r   r   r   r   r   r   r   r   r  appendr{   catr   	ones_likescatter_add_meanlenr   r   r   r  )r6  rK   r   r   r.   compute_dtypecompute_deviceall_expert_indicesall_routing_weightslayer_gate_logitsr  r	  r
  r  r  r  r  r  expert_indicesr  tokens_per_expertpadrouter_prob_per_expert
batch_sizesequence_lengthr:   expert_attention_mask router_per_expert_attention_maskoverall_losss                                rU   load_balancing_loss_funcrL  O  si   @ *[%"@"@N((M ^**N(-00@7H7M7Mh\^7M7_44y''+h.@.@.DD
))"-89;N;Nr;RR__@j&6&6s&;@R@
!&&C(9(9#2(>CC(ooeo<$++B0@A))JB7!!.1""?3! )" #51=))$7Q?/44R8!KKQ_`oo0n]-::1>PRUVYkYqYqrsYtt "',?Q!G&4&:&:#
O, 4At+,V&
OUKLWR[R	 	 044R89N9S9S9UV "KKQ_`oo0n]-::1>PRUVY^YbYb!Z
 
 4At+,V&
O[QRWR%R	 	) "'+>Aa+agh!ilqlulu,!m
 "
 99.1GGHL+%%rW   c                   f  ^  \ rS rSrU 4S jr          SS\\R                     S\\R                     S\\R                     S\\	\R                        S\\R                     S\\R                     S	\\   S
\\R                     S\\\R                  4   S\\   S\\   S\4S jjrSrU =r$ )DogeForCausalLMi  c                 f   > [         TU ]  U5        [        U5      U l        UR                  U l        g r   )rP   rQ   r5  modelrK   r   s     rU   rQ   DogeForCausalLM.__init__  s*     v&
!--rW   r+   r.   r  r%   r,   labelsr?   r   logits_to_keeprN   rS   rw   c                    U
b  U
OU R                   R                  n
U R                  " SUUUUUUUS.UD6nUR                  n[	        U	[
        5      (       a  [        U	* S5      OU	nU R                  USS2USS24   5      nSnUb  U R                  " XU R                  40 UD6nSnU
(       a  [        UR                  U R                  [        R                  " [        R                  " U R                  5      5      U R                   U5      nUb+  UU R"                  UR%                  UR&                  5      -  -  n[)        UUUUR*                  UR,                  UR.                  UR                  S9$ )a  
labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
    Labels for computing the masked language modeling loss. Indices should either be in `[0, ...,
    config.vocab_size]` or -100 (see `input_ids` docstring). Tokens with indices set to `-100` are ignored
    (masked), the loss is only computed for the tokens with labels in `[0, ..., config.vocab_size]`.

Example:

```python
>>> from transformers import AutoTokenizer, DogeForCausalLM

>>> model = DogeForCausalLM.from_pretrained("SmallDoge/Doge-320M")
>>> tokenizer = AutoTokenizer.from_pretrained("SmallDoge/Doge-320M")

>>> prompt = "Hey, are you conscious? Can you talk to me?"
>>> inputs = tokenizer(prompt, return_tensors="pt")

>>> # Generate
>>> generate_ids = model.generate(inputs.input_ids, max_length=30)
>>> tokenizer.batch_decode(generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]
"Hey, are you conscious? Can you talk to me?\nI'm not conscious, but I can talk to you."
```N)r+   r.   r  r%   r,   r?   r   )lossaux_losslogitsr%   r-   r)  r  r6   )r   rN   rP  last_hidden_stater   r   slicelm_headloss_functionr7   rL  r  rK   r   r   r   rL   rO   r   r   r   r%   r-   r)  )rR   r+   r.   r  r%   r,   rR  r?   r   rS  rN   rS   outputsr-   slice_indicesrW  rU  rV  s                     rU   r   DogeForCausalLM.forward  sm   J %9$D $++JjJj 	
 +/** 	+
)%+')	+
 	+
  118B>SV8W8W~ot4]kmA}a,?@A%%fdooPPD/%%  

499T%5%567((H !11HKK4LLL(#33!//))!//
 	
rW   )rP  rK   )
NNNNNNNNr   N)r^   r_   r`   ra   rQ   r   r{   r   r   listr%  r   r   r   r   r   r   r   rg   rh   ri   s   @rU   rN  rN    s"   . 151537=A59-1$(5934/3Q
E,,-Q
 !.Q
 u//0	Q

 "$u'8'8"9:Q
   1 12Q
 ))*Q
 D>Q
 !!1!12Q
 c5<</0Q
 'tnQ
 +,Q
 
#Q
 Q
rW   rN  c                       \ rS rSrSrg)DogeForSequenceClassificationi  r6   Nrl   r6   rW   rU   ra  ra    rm   rW   ra  )r"   rN  r5  r'  ra  r   )NNr   N)Erb   r   typingr   r   r   r{   torch.nn.functionalr   
functionalr   activationsr   cache_utilsr	   configuration_utilsr
   integrations.flex_attentionr   modeling_layersr   modeling_outputsr   r   modeling_rope_utilsr   modeling_utilsr   processing_utilsr   utilsr   r   utils.genericr   llama.modeling_llamar   r   r   r   r   r   r   r   mixtral.modeling_mixtralr   r   !torch.nn.attention.flex_attentionr    r"   rk   ro   Moduler   floatr   r   r   r   r   r   r  r'  r5  r   rL  rN  ra  __all__r6   rW   rU   <module>rv     sQ  "   , ,     !   3 J 9 Q 9 0 & E +	 	 	 H  !!;S
! S
l	, 		. 	  $#(,.*II.*<<.* 
.* <<	.*
 %,,34.* e_.* e_.* %.* 5<<%&.*b -. 1G - .zBII zz	h 	6,		 6,r/1 /d?. ?,	 	 "&"-1g&u||U5<<%8$>?g&#g& smg& 	g&
 U\\*g& 5<<g&TW
( W
t	$B 	rW   