
"""VJEPA 2 model configuration"""

from ...configuration_utils import PretrainedConfig


class VJEPA2Config(PretrainedConfig):
    r"""
This is the configuration class to store the configuration of a [`VJEPA2Model`]. It is used to instantiate an
VJEPA2 model according to the specified arguments, defining the model architecture. Instantiating a configuration
with the defaults will yield a similar configuration to that of the VJEPA2
[facebook/vjepa2-vitl-fpc64-256](https://huggingface.co/facebook/vjepa2-vitl-fpc64-256) architecture.

Configuration objects inherit from [`PretrainedConfig`] and can be used to control the model outputs. Read the
documentation from [`PretrainedConfig`] for more information.

Args:
    patch_size (`int`, *optional*, defaults to 16):
        The size (resolution) of each patch.
    crop_size (`int`, *optional*, defaults to 256):
        Input resolution of the model.
    frames_per_clip (`int`, *optional*, defaults to 64):
        The number of frames the model has been pretrained with. Does not impact inference.
    tubelet_size (`int`, *optional*, defaults to 2):
        The number of temporal frames used for a single raster (tubelet); check the paper for more information.
        A sketch of how this interacts with `patch_size`, `crop_size` and `frames_per_clip` follows the argument list.
    hidden_size (`int`, *optional*, defaults to 1024):
        Dimensionality of the encoder layers.
    in_chans (`int`, *optional*, defaults to 3):
        The number of input channels.
    num_attention_heads (`int`, *optional*, defaults to 16):
        Number of attention heads for each attention layer in the Encoder.
    num_hidden_layers (`int`, *optional*, defaults to 24):
        The number of hidden layers in the Encoder.
    drop_path_rate (`float`, *optional*, defaults to 0.0):
        Stochastic depth rate per sample (when applied in the main path of residual layers).
    mlp_ratio (`float`, *optional*, defaults to 4.0):
        Ratio of the hidden size of the MLPs used in the Encoder relative to `hidden_size`.
    layer_norm_eps (`float`, *optional*, defaults to 1e-06):
        The epsilon used by the layer normalization layers.
    qkv_bias (`bool`, *optional*, defaults to `True`):
        Whether to add a bias to the queries, keys and values.
    attention_probs_dropout_prob (`float`, *optional*, defaults to 0.0):
        The dropout probability for the attention probabilities.
    hidden_act (`str`, *optional*, defaults to `"gelu"`):
        The non-linear activation function (function or string) in the encoder and pooler. If string, `"gelu"`,
        `"relu"`, `"selu"` and `"gelu_new"` are supported.
    initializer_range (`float`, *optional*, defaults to 0.02):
        The standard deviation of the truncated_normal_initializer for initializing all weight matrices.
    attention_dropout (`float`, *optional*, defaults to 0.0):
        The dropout probability for attentions.
    num_pooler_layers (`int`, *optional*, defaults to 3):
        The number of self-attention layers in the pooler.
    pred_hidden_size (`int`, *optional*, defaults to 384):
        Dimensionality of the predictor layers.
    pred_num_attention_heads (`int`, *optional*, defaults to 12):
        Number of attention heads for each attention layer in the Predictor.
    pred_num_hidden_layers (`int`, *optional*, defaults to 12):
        Number of hidden layers in the Predictor.
    pred_num_mask_tokens (`int`, *optional*, defaults to 10):
        The number of mask tokens to use in the Predictor.
    pred_zero_init_mask_tokens (`bool`, *optional*, defaults to `True`):
        Whether to initialize the mask tokens in the Predictor to zero.
    pred_mlp_ratio (`float`, *optional*, defaults to 4.0):
        Ratio of the hidden size of the MLPs used in Predictor relative to the `pred_hidden_size`.
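
For intuition, and assuming the standard tubelet patchification implied by the arguments above (each token covers a
`patch_size` x `patch_size` spatial patch spanning `tubelet_size` consecutive frames), the number of tokens the
encoder processes per clip can be sketched as below. This is an illustrative calculation only, not an attribute of
the configuration:

```python
>>> # Illustrative only: token count per clip under standard tubelet patchification,
>>> # assuming a square crop and frames_per_clip divisible by tubelet_size.
>>> crop_size, patch_size = 256, 16
>>> frames_per_clip, tubelet_size = 64, 2
>>> (crop_size // patch_size) ** 2 * (frames_per_clip // tubelet_size)
8192
```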

Example:

```python
>>> from transformers import VJEPA2Config, VJEPA2Model

>>> # Initializing a VJEPA2 vjepa2-vitl-fpc64-256 style configuration
>>> configuration = VJEPA2Config()

>>> # Initializing a model (with random weights) from the vjepa2-vitl-fpc64-256 style configuration
>>> model = VJEPA2Model(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
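
>>> # Illustrative only: defaults can be overridden to build a custom, hypothetical smaller
>>> # variant (the values below are placeholders, not a released checkpoint)
>>> small_configuration = VJEPA2Config(hidden_size=384, num_attention_heads=6, num_hidden_layers=12)

>>> # As with any `PretrainedConfig`, the configuration can be saved and reloaded
>>> # (the local path is a placeholder)
>>> configuration.save_pretrained("./my-vjepa2-config")  # doctest: +SKIP
>>> configuration = VJEPA2Config.from_pretrained("./my-vjepa2-config")  # doctest: +SKIP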
```
    """

    model_type = "vjepa2"

    def __init__(
        self,
        patch_size=16,
        crop_size=256,
        frames_per_clip=64,
        tubelet_size=2,
        hidden_size=1024,
        in_chans=3,
        num_attention_heads=16,
        num_hidden_layers=24,
        drop_path_rate=0.0,
        mlp_ratio=4.0,
        layer_norm_eps=1e-6,
        qkv_bias=True,
        attention_probs_dropout_prob=0.0,
        hidden_act="gelu",
        initializer_range=0.02,
        attention_dropout=0.0,
        num_pooler_layers=3,
        pred_hidden_size=384,
        pred_num_attention_heads=12,
        pred_num_hidden_layers=12,
        pred_num_mask_tokens=10,
        pred_zero_init_mask_tokens=True,
        pred_mlp_ratio=4.0,
        **kwargs,
    ):
        super().__init__(**kwargs)

        self.crop_size = crop_size
        self.frames_per_clip = frames_per_clip
        self.patch_size = patch_size
        self.tubelet_size = tubelet_size
        self.hidden_size = hidden_size
        self.in_chans = in_chans
        self.num_attention_heads = num_attention_heads
        self.num_hidden_layers = num_hidden_layers
        self.drop_path_rate = drop_path_rate
        self.mlp_ratio = mlp_ratio
        self.layer_norm_eps = layer_norm_eps
        self.qkv_bias = qkv_bias
        self.attention_probs_dropout_prob = attention_probs_dropout_prob
        self.hidden_act = hidden_act
        self.initializer_range = initializer_range
        self.image_size = crop_size
        self.attention_dropout = attention_dropout
        self.num_pooler_layers = num_pooler_layers
        self.pred_hidden_size = pred_hidden_size
        self.pred_num_attention_heads = pred_num_attention_heads
        self.pred_num_hidden_layers = pred_num_hidden_layers
        self.pred_num_mask_tokens = pred_num_mask_tokens
        self.pred_zero_init_mask_tokens = pred_zero_init_mask_tokens
        self.pred_mlp_ratio = pred_mlp_ratio


__all__ = ["VJEPA2Config"]