ó
    <±hq%  ã                   óÄ   • S r SSKrSSKJr  SSKJr  SSKJrJr  SSK	J
r
Jr  SSKJrJr  SS	KJrJrJr  \R&                  " \5      r " S
 S\
5      r " S S\5      rSS/rg)zLayoutLM model configurationé    N©ÚOrderedDict)ÚMapping)ÚAnyÚOptionalé   )ÚPretrainedConfigÚPreTrainedTokenizer)Ú
OnnxConfigÚPatchingSpec)Ú
TensorTypeÚis_torch_availableÚloggingc                   óˆ   ^ • \ rS rSrSrSr                SU 4S jjr\S 5       r\R                  S 5       rSr
U =r$ )	ÚLayoutLMConfigé   aé  
This is the configuration class to store the configuration of a [`LayoutLMModel`]. It is used to instantiate a
LayoutLM model according to the specified arguments, defining the model architecture. Instantiating a configuration
with the defaults will yield a similar configuration to that of the LayoutLM
[microsoft/layoutlm-base-uncased](https://huggingface.co/microsoft/layoutlm-base-uncased) architecture.

Configuration objects inherit from [`BertConfig`] and can be used to control the model outputs. Read the
documentation from [`BertConfig`] for more information.


Args:
    vocab_size (`int`, *optional*, defaults to 30522):
        Vocabulary size of the LayoutLM model. Defines the different tokens that can be represented by the
        *inputs_ids* passed to the forward method of [`LayoutLMModel`].
    hidden_size (`int`, *optional*, defaults to 768):
        Dimensionality of the encoder layers and the pooler layer.
    num_hidden_layers (`int`, *optional*, defaults to 12):
        Number of hidden layers in the Transformer encoder.
    num_attention_heads (`int`, *optional*, defaults to 12):
        Number of attention heads for each attention layer in the Transformer encoder.
    intermediate_size (`int`, *optional*, defaults to 3072):
        Dimensionality of the "intermediate" (i.e., feed-forward) layer in the Transformer encoder.
    hidden_act (`str` or `function`, *optional*, defaults to `"gelu"`):
        The non-linear activation function (function or string) in the encoder and pooler. If string, `"gelu"`,
        `"relu"`, `"silu"` and `"gelu_new"` are supported.
    hidden_dropout_prob (`float`, *optional*, defaults to 0.1):
        The dropout probability for all fully connected layers in the embeddings, encoder, and pooler.
    attention_probs_dropout_prob (`float`, *optional*, defaults to 0.1):
        The dropout ratio for the attention probabilities.
    max_position_embeddings (`int`, *optional*, defaults to 512):
        The maximum sequence length that this model might ever be used with. Typically set this to something large
        just in case (e.g., 512 or 1024 or 2048).
    type_vocab_size (`int`, *optional*, defaults to 2):
        The vocabulary size of the `token_type_ids` passed into [`LayoutLMModel`].
    initializer_range (`float`, *optional*, defaults to 0.02):
        The standard deviation of the truncated_normal_initializer for initializing all weight matrices.
    layer_norm_eps (`float`, *optional*, defaults to 1e-12):
        The epsilon used by the layer normalization layers.
    pad_token_id (`int`, *optional*, defaults to 0):
        The value used to pad input_ids.
    position_embedding_type (`str`, *optional*, defaults to `"absolute"`):
        Type of position embedding. Choose one of `"absolute"`, `"relative_key"`, `"relative_key_query"`. For
        positional embeddings use `"absolute"`. For more information on `"relative_key"`, please refer to
        [Self-Attention with Relative Position Representations (Shaw et al.)](https://huggingface.co/papers/1803.02155).
        For more information on `"relative_key_query"`, please refer to *Method 4* in [Improve Transformer Models
        with Better Relative Position Embeddings (Huang et al.)](https://huggingface.co/papers/2009.13658).
    use_cache (`bool`, *optional*, defaults to `True`):
        Whether or not the model should return the last key/values attentions (not used by all models). Only
        relevant if `config.is_decoder=True`.
    max_2d_position_embeddings (`int`, *optional*, defaults to 1024):
        The maximum value that the 2D position embedding might ever used. Typically set this to something large
        just in case (e.g., 1024).

Examples:

```python
>>> from transformers import LayoutLMConfig, LayoutLMModel

>>> # Initializing a LayoutLM configuration
>>> configuration = LayoutLMConfig()

>>> # Initializing a model (with random weights) from the configuration
>>> model = LayoutLMModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```Úlayoutlmc                 óà   >• [         TU ]  " SSU0UD6  Xl        X l        X0l        X@l        X`l        XPl        Xpl        X€l	        Xl
        X l        X°l        XÀl        Xàl        Xðl        UU l        g )NÚpad_token_id© )ÚsuperÚ__init__Ú
vocab_sizeÚhidden_sizeÚnum_hidden_layersÚnum_attention_headsÚ
hidden_actÚintermediate_sizeÚhidden_dropout_probÚattention_probs_dropout_probÚmax_position_embeddingsÚtype_vocab_sizeÚinitializer_rangeÚlayer_norm_epsÚ_position_embedding_typeÚ	use_cacheÚmax_2d_position_embeddings)Úselfr   r   r   r   r   r   r   r    r!   r"   r#   r$   r   Úposition_embedding_typer&   r'   ÚkwargsÚ	__class__s                     €Úk/var/www/html/shao/venv/lib/python3.13/site-packages/transformers/models/layoutlm/configuration_layoutlm.pyr   ÚLayoutLMConfig.__init__e   ss   ø€ ô( 	‰ÒÑ= lÐ=°fÒ=Ø$ŒØ&ÔØ!2ÔØ#6Ô Ø$ŒØ!2ÔØ#6Ô Ø,HÔ)Ø'>Ô$Ø.ÔØ!2ÔØ,ÔØ(?Ô%Ø"ŒØ*DˆÕ'ó    c                 óP   • [         R                  " S[        5        U R                  $ )NzSThe `position_embedding_type` attribute is deprecated and will be removed in v4.55.)ÚwarningsÚwarnÚFutureWarningr%   ©r(   s    r,   r)   Ú&LayoutLMConfig.position_embedding_typeŠ   s"   € äŠØaÜô	
ð ×,Ñ,Ð,r.   c                 ó   • Xl         g )N)r%   )r(   Úvalues     r,   r)   r4   ’   s   € à(-Õ%r.   )r%   r    r   r   r   r#   r   r$   r'   r!   r   r   r"   r&   r   )i:w  i   é   r7   i   Úgeluçš™™™™™¹?r9   i   é   g{®Gáz”?gê-™—q=r   ÚabsoluteTi   )Ú__name__Ú
__module__Ú__qualname__Ú__firstlineno__Ú__doc__Ú
model_typer   Úpropertyr)   ÚsetterÚ__static_attributes__Ú__classcell__©r+   s   @r,   r   r      sx   ø† ñBðH €Jð ØØØØØØØ%(Ø #ØØØØØ *ØØ#'÷##EðJ ñ-ó ð-ð ×#Ñ#ñ.ó $ö.r.   r   c                   ó¼   ^ • \ rS rSr  SS\S\S\\\      4U 4S jjjr	\
S\\\\\4   4   4S j5       r    SS\S	\S
\S\S\\   S\\\4   4U 4S jjjrSrU =r$ )ÚLayoutLMOnnxConfigé—   ÚconfigÚtaskÚpatching_specsc                 óJ   >• [         TU ]  XUS9  UR                  S-
  U l        g )N)rK   rL   é   )r   r   r'   Úmax_2d_positions)r(   rJ   rK   rL   r+   s       €r,   r   ÚLayoutLMOnnxConfig.__init__˜   s*   ø€ ô 	‰Ñ˜¸>ÐÑJØ &× AÑ AÀAÑ EˆÕr.   Úreturnc           	      óH   • [        SSSS.4SSSS.4SSSS.4SSSS.4/5      $ )NÚ	input_idsÚbatchÚsequence)r   rN   ÚbboxÚattention_maskÚtoken_type_idsr   r3   s    r,   ÚinputsÚLayoutLMOnnxConfig.inputs¡   sH   € äà '¨jÑ9Ð:Ø˜W¨Ñ4Ð5Ø! w°:Ñ#>Ð?Ø! w°:Ñ#>Ð?ð	ó
ð 	
r.   Ú	tokenizerÚ
batch_sizeÚ
seq_lengthÚis_pairÚ	frameworkc                 ó   >• [         T	U ]  XX4US9n/ SQnU[        R                  :X  d  [	        S5      e[        5       (       d  [        S5      eSSKnUS   R                  u  p#UR                  / U/U-  Q5      R                  USS5      US	'   U$ )
a>  
Generate inputs to provide to the ONNX exporter for the specific framework

Args:
    tokenizer: The tokenizer associated with this model configuration
    batch_size: The batch size (int) to export the model for (-1 means dynamic axis)
    seq_length: The sequence length (int) to export the model for (-1 means dynamic axis)
    is_pair: Indicate if the input is a pair (sentence 1, sentence 2)
    framework: The framework (optional) the tokenizer will generate tensor for

Returns:
    Mapping[str, Tensor] holding the kwargs to provide to the model's forward function
)r\   r]   r^   r_   )é0   éT   éI   é€   zCExporting LayoutLM to ONNX is currently only supported for PyTorch.z7Cannot generate dummy inputs without PyTorch installed.r   NrS   rN   rV   )r   Úgenerate_dummy_inputsr   ÚPYTORCHÚNotImplementedErrorr   Ú
ValueErrorÚtorchÚshapeÚtensorÚtile)
r(   r[   r\   r]   r^   r_   Ú
input_dictÚboxri   r+   s
            €r,   re   Ú(LayoutLMOnnxConfig.generate_dummy_inputs¬   s¤   ø€ ô, ‘WÑ2Ø¸Ð`ið 3ð 
ˆ
ò
  ˆàœJ×.Ñ.Ó.Ü%Ð&kÓlÐlä!×#Ñ#ÜÐVÓWÐWÛà!+¨KÑ!8×!>Ñ!>Ñˆ
Ø"Ÿ\™\Ð*?¨S¨E°JÑ,>Ð*?Ó@×EÑEÀjÐRSÐUVÓWˆ
6ÑØÐr.   )rO   )ÚdefaultN)éÿÿÿÿrq   FN)r<   r=   r>   r?   r	   Ústrr   Úlistr   r   rB   r   ÚintrY   r
   Úboolr   r   re   rD   rE   rF   s   @r,   rH   rH   —   sÎ   ø† ð Ø7;ñ	Fà ðFð ðFð !  lÑ!3Ñ4÷	Fð Fð ð
˜  W¨S°#¨XÑ%6Ð 6Ñ7ó 
ó ð
ð ØØØ*.ñ&à&ð&ð ð&ð ð	&ð
 ð&ð ˜JÑ'ð&ð 
cÑ	÷&ö &r.   rH   )r@   r0   Úcollectionsr   Úcollections.abcr   Útypingr   r   Ú r	   r
   Úonnxr   r   Úutilsr   r   r   Ú
get_loggerr<   Úloggerr   rH   Ú__all__r   r.   r,   Ú<module>r      s^   ðñ #ã Ý #Ý #ß  ç 5ß ,ß <Ñ <ð 
×	Ò	˜HÓ	%€ôv.Ð%ô v.ôr;˜ô ;ð| Ð1Ð
2r.   