
import enum
import warnings
from typing import Any, Union

from ..generation import GenerationConfig
from ..tokenization_utils import TruncationStrategy
from ..utils import add_end_docstrings, is_tf_available, is_torch_available, logging
from .base import Pipeline, build_pipeline_init_args


if is_tf_available():
    import tensorflow as tf

    from ..models.auto.modeling_tf_auto import TF_MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES

if is_torch_available():
    from ..models.auto.modeling_auto import MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES

logger = logging.get_logger(__name__)


class ReturnType(enum.Enum):
    TENSORS = 0
    TEXT = 1


@add_end_docstrings(build_pipeline_init_args(has_tokenizer=True))
class Text2TextGenerationPipeline(Pipeline):
    """
    Pipeline for text to text generation using seq2seq models.

    Unless the model you're using explicitly sets these generation parameters in its configuration files
    (`generation_config.json`), the following default values will be used:
    - max_new_tokens: 256
    - num_beams: 4
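
    These defaults can be overridden by passing `generate` arguments through the pipeline call; a minimal
    sketch (the parameter values below are illustrative only):

    ```python
    >>> from transformers import pipeline

    >>> generator = pipeline("text2text-generation")
    >>> generator("question: What is 42 ?", max_new_tokens=32, num_beams=1)  # greedy search, shorter output
    ```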

    Example:

    ```python
    >>> from transformers import pipeline

    >>> generator = pipeline(model="mrm8488/t5-base-finetuned-question-generation-ap")
    >>> generator(
    ...     "answer: Manuel context: Manuel has created RuPERTa-base with the support of HF-Transformers and Google"
    ... )
    [{'generated_text': 'question: Who created the RuPERTa-base?'}]
    ```

    Learn more about the basics of using a pipeline in the [pipeline tutorial](../pipeline_tutorial). You can pass text
    generation parameters to this pipeline to control stopping criteria, decoding strategy, and more. Learn more about
    text generation parameters in [Text generation strategies](../generation_strategies) and [Text
    generation](text_generation).
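
    For instance, stopping criteria and decoding strategy can be set directly in the call; a sketch (the
    `stop_sequence` and sampling values here are illustrative assumptions):

    ```python
    >>> generator("question: What is 42 ?", do_sample=True, top_k=50, stop_sequence=".")
    ```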

    This Text2TextGenerationPipeline pipeline can currently be loaded from [`pipeline`] using the following task
    identifier: `"text2text-generation"`.

    The models that this pipeline can use are models that have been fine-tuned on a text-to-text generation task. See
    the up-to-date list of available models on
    [huggingface.co/models](https://huggingface.co/models?filter=text2text-generation). For a list of available
    parameters, see the [following
    documentation](https://huggingface.co/docs/transformers/en/main_classes/text_generation#transformers.generation.GenerationMixin.generate).

    Usage:

    ```python
    text2text_generator = pipeline("text2text-generation")
    text2text_generator("question: What is 42 ? context: 42 is the answer to life, the universe and everything")
    ```
    """

    _pipeline_calls_generate = True
    _load_processor = False
    _load_image_processor = False
    _load_feature_extractor = False
    _load_tokenizer = True

    # Keep the class docstring in sync with these defaults.
    _default_generation_config = GenerationConfig(
        max_new_tokens=256,
        num_beams=4,
    )

    # Prefix used for the keys of the returned dicts, e.g. "generated_text".
    return_name = "generated"

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

        self.check_model_type(
            TF_MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES
            if self.framework == "tf"
            else MODEL_FOR_SEQ_TO_SEQ_CAUSAL_LM_MAPPING_NAMES
        )

    def _sanitize_parameters(
        self,
        return_tensors=None,
        return_text=None,
        return_type=None,
        clean_up_tokenization_spaces=None,
        truncation=None,
        stop_sequence=None,
        **generate_kwargs,
    ):
        preprocess_params = {}
        if truncation is not None:
            preprocess_params["truncation"] = truncation

        forward_params = generate_kwargs

        postprocess_params = {}
        if return_tensors is not None and return_type is None:
            return_type = ReturnType.TENSORS if return_tensors else ReturnType.TEXT
        if return_type is not None:
            postprocess_params["return_type"] = return_type
        if clean_up_tokenization_spaces is not None:
            postprocess_params["clean_up_tokenization_spaces"] = clean_up_tokenization_spaces

        if stop_sequence is not None:
            stop_sequence_ids = self.tokenizer.encode(stop_sequence, add_special_tokens=False)
            if len(stop_sequence_ids) > 1:
                warnings.warn(
                    "Stopping on a multiple token sequence is not yet supported on transformers. The first token of"
                    " the stop sequence will be used as the stop sequence string in the interim."
                )
            generate_kwargs["eos_token_id"] = stop_sequence_ids[0]

        if self.assistant_model is not None:
            forward_params["assistant_model"] = self.assistant_model
        if self.assistant_tokenizer is not None:
            forward_params["tokenizer"] = self.tokenizer
            forward_params["assistant_tokenizer"] = self.assistant_tokenizer

        return preprocess_params, forward_params, postprocess_params

    def check_inputs(self, input_length: int, min_length: int, max_length: int):
        """
        Checks whether there might be something wrong with the given input with regard to the model.
        """
        return True

    def _parse_and_tokenize(self, *args, truncation):
        prefix = self.prefix if self.prefix is not None else ""
        if isinstance(args[0], list):
            if self.tokenizer.pad_token_id is None:
                raise ValueError("Please make sure that the tokenizer has a pad_token_id when using a batch input")
            args = ([prefix + arg for arg in args[0]],)
            padding = True
        elif isinstance(args[0], str):
            args = (prefix + args[0],)
            padding = False
        else:
            raise TypeError(
                f"`args[0]`: {args[0]} has the wrong format. It should be either of type `str` or of type `list`."
            )
        inputs = self.tokenizer(*args, padding=padding, truncation=truncation, return_tensors=self.framework)
        # `token_type_ids` is produced by some tokenizers but is not a valid `generate` kwarg.
        if "token_type_ids" in inputs:
            del inputs["token_type_ids"]
        return inputs

    def __call__(self, *args: Any, **kwargs: Any) -> Union[list[dict[str, Any]], list[list[dict[str, Any]]]]:
        r"""
        Generate the output text(s) using text(s) given as inputs.

        Args:
            args (`str` or `list[str]`):
                Input text for the encoder.
            return_tensors (`bool`, *optional*, defaults to `False`):
                Whether or not to include the tensors of predictions (as token indices) in the outputs.
            return_text (`bool`, *optional*, defaults to `True`):
                Whether or not to include the decoded texts in the outputs.
            clean_up_tokenization_spaces (`bool`, *optional*, defaults to `False`):
                Whether or not to clean up the potential extra spaces in the text output.
            truncation (`TruncationStrategy`, *optional*, defaults to `TruncationStrategy.DO_NOT_TRUNCATE`):
                The truncation strategy for the tokenization within the pipeline. `TruncationStrategy.DO_NOT_TRUNCATE`
                (default) will never truncate, but it is sometimes desirable to truncate the input to fit the model's
                max_length instead of throwing an error down the line.
            generate_kwargs:
                Additional keyword arguments to pass along to the generate method of the model (see the generate method
                corresponding to your framework [here](./text_generation)).

        Return:
            A list or a list of list of `dict`: Each result comes as a dictionary with the following keys:

            - **generated_text** (`str`, present when `return_text=True`) -- The generated text.
            - **generated_token_ids** (`torch.Tensor` or `tf.Tensor`, present when `return_tensors=True`) -- The token
              ids of the generated text.
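
        Example (a minimal sketch of a batched call; when a list of texts is passed and each input yields a
        single generated sequence, the results come back as a flat list of dicts):

        ```python
        >>> outputs = generator(["question: Who wrote it?", "question: When was it written?"])
        >>> [out["generated_text"] for out in outputs]
        ```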
        """
        result = super().__call__(*args, **kwargs)
        if (
            isinstance(args[0], list)
            and all(isinstance(el, str) for el in args[0])
            and all(len(res) == 1 for res in result)
        ):
            return [res[0] for res in result]
        return result

    def preprocess(self, inputs, truncation=TruncationStrategy.DO_NOT_TRUNCATE, **kwargs):
        inputs = self._parse_and_tokenize(inputs, truncation=truncation, **kwargs)
        return inputs

    def _forward(self, model_inputs, **generate_kwargs):
        if self.framework == "pt":
            in_b, input_length = model_inputs["input_ids"].shape
        elif self.framework == "tf":
            in_b, input_length = tf.shape(model_inputs["input_ids"]).numpy()

        self.check_inputs(
            input_length,
            generate_kwargs.get("min_length", self.generation_config.min_length),
            generate_kwargs.get("max_length", self.generation_config.max_length),
        )

        # A user-supplied `generation_config` passed at call time takes precedence.
        if "generation_config" not in generate_kwargs:
            generate_kwargs["generation_config"] = self.generation_config

        output_ids = self.model.generate(**model_inputs, **generate_kwargs)
        out_b = output_ids.shape[0]
        # Regroup the generated sequences by input: one row per input text.
        if self.framework == "pt":
            output_ids = output_ids.reshape(in_b, out_b // in_b, *output_ids.shape[1:])
        elif self.framework == "tf":
            output_ids = tf.reshape(output_ids, (in_b, out_b // in_b, *output_ids.shape[1:]))
        return {"output_ids": output_ids}

    def postprocess(self, model_outputs, return_type=ReturnType.TEXT, clean_up_tokenization_spaces=False):
        records = []
        for output_ids in model_outputs["output_ids"][0]:
            if return_type == ReturnType.TENSORS:
                record = {f"{self.return_name}_token_ids": output_ids}
            elif return_type == ReturnType.TEXT:
                record = {
                    f"{self.return_name}_text": self.tokenizer.decode(
                        output_ids,
                        skip_special_tokens=True,
                        clean_up_tokenization_spaces=clean_up_tokenization_spaces,
                    )
                }
            records.append(record)
        return records


@add_end_docstrings(build_pipeline_init_args(has_tokenizer=True))
class SummarizationPipeline(Text2TextGenerationPipeline):
    """
    Summarize news articles and other documents.

    This summarizing pipeline can currently be loaded from [`pipeline`] using the following task identifier:
    `"summarization"`.

    The models that this pipeline can use are models that have been fine-tuned on a summarization task, currently
    including '*bart-large-cnn*', '*google-t5/t5-small*', '*google-t5/t5-base*', '*google-t5/t5-large*',
    '*google-t5/t5-3b*' and '*google-t5/t5-11b*'. See the up-to-date
    list of available models on [huggingface.co/models](https://huggingface.co/models?filter=summarization). For a list
    of available parameters, see the [following
    documentation](https://huggingface.co/docs/transformers/en/main_classes/text_generation#transformers.generation.GenerationMixin.generate).

    Unless the model you're using explicitly sets these generation parameters in its configuration files
    (`generation_config.json`), the following default values will be used:
    - max_new_tokens: 256
    - num_beams: 4

    Usage:

    ```python
    # use bart in pytorch
    summarizer = pipeline("summarization")
    summarizer("An apple a day, keeps the doctor away", min_length=5, max_length=20)

    # use t5 in tf
    summarizer = pipeline("summarization", model="google-t5/t5-base", tokenizer="google-t5/t5-base", framework="tf")
    summarizer("An apple a day, keeps the doctor away", min_length=5, max_length=20)
    ```
    """

    # Prefix used for the keys of the returned dicts, e.g. "summary_text".
    return_name = "summary"

    def __call__(self, *args, **kwargs):
        r"""
        Summarize the text(s) given as inputs.

        Args:
            documents (*str* or `list[str]`):
                One or several articles (or one list of articles) to summarize.
            return_text (`bool`, *optional*, defaults to `True`):
                Whether or not to include the decoded texts in the outputs.
            return_tensors (`bool`, *optional*, defaults to `False`):
                Whether or not to include the tensors of predictions (as token indices) in the outputs.
            clean_up_tokenization_spaces (`bool`, *optional*, defaults to `False`):
                Whether or not to clean up the potential extra spaces in the text output.
            generate_kwargs:
                Additional keyword arguments to pass along to the generate method of the model (see the generate method
                corresponding to your framework [here](./text_generation)).

        Return:
            A list or a list of list of `dict`: Each result comes as a dictionary with the following keys:

            - **summary_text** (`str`, present when `return_text=True`) -- The summary of the corresponding input.
            - **summary_token_ids** (`torch.Tensor` or `tf.Tensor`, present when `return_tensors=True`) -- The token
              ids of the summary.
        """
        return super().__call__(*args, **kwargs)

    def check_inputs(self, input_length: int, min_length: int, max_length: int) -> bool:
        """
        Checks whether there might be something wrong with the given input with regard to the model.
        """
        if max_length < min_length:
            logger.warning(f"Your min_length={min_length} must be smaller than your max_length={max_length}.")

        if input_length < max_length:
            logger.warning(
                f"Your max_length is set to {max_length}, but your input_length is only {input_length}. Since this is "
                "a summarization task, where outputs shorter than the input are typically wanted, you might consider "
                f"decreasing max_length manually, e.g. summarizer('...', max_length={input_length // 2})"
            )


@add_end_docstrings(build_pipeline_init_args(has_tokenizer=True))
class TranslationPipeline(Text2TextGenerationPipeline):
    """
    Translates from one language to another.

    This translation pipeline can currently be loaded from [`pipeline`] using the following task identifier:
    `"translation_xx_to_yy"`.

    The models that this pipeline can use are models that have been fine-tuned on a translation task. See the
    up-to-date list of available models on [huggingface.co/models](https://huggingface.co/models?filter=translation).
    For a list of available parameters, see the [following
    documentation](https://huggingface.co/docs/transformers/en/main_classes/text_generation#transformers.generation.GenerationMixin.generate).
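
    Multilingual checkpoints typically also expect `src_lang` and `tgt_lang` to be set; a sketch (the NLLB
    checkpoint and language codes below are illustrative assumptions):

    ```python
    >>> translator = pipeline("translation", model="facebook/nllb-200-distilled-600M")
    >>> translator("How old are you?", src_lang="eng_Latn", tgt_lang="fra_Latn")
    ```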

    Unless the model you're using explicitly sets these generation parameters in its configuration files
    (`generation_config.json`), the following default values will be used:
    - max_new_tokens: 256
    - num_beams: 4

    Usage:

    ```python
    en_fr_translator = pipeline("translation_en_to_fr")
    en_fr_translator("How old are you?")
    ```
    """

    # Prefix used for the keys of the returned dicts, e.g. "translation_text".
    return_name = "translation"

    def check_inputs(self, input_length: int, min_length: int, max_length: int):
        if input_length > 0.9 * max_length:
            logger.warning(
                f"Your input_length: {input_length} is bigger than 0.9 * max_length: {max_length}. You might consider "
                "increasing your max_length manually, e.g. translator('...', max_length=400)"
            )
        return True

    def preprocess(self, *args, truncation=TruncationStrategy.DO_NOT_TRUNCATE, src_lang=None, tgt_lang=None):
        if getattr(self.tokenizer, "_build_translation_inputs", None):
            return self.tokenizer._build_translation_inputs(
                *args, return_tensors=self.framework, truncation=truncation, src_lang=src_lang, tgt_lang=tgt_lang
            )
        else:
            return super()._parse_and_tokenize(*args, truncation=truncation)

    def _sanitize_parameters(self, src_lang=None, tgt_lang=None, **kwargs):
        preprocess_params, forward_params, postprocess_params = super()._sanitize_parameters(**kwargs)
        if src_lang is not None:
            preprocess_params["src_lang"] = src_lang
        if tgt_lang is not None:
            preprocess_params["tgt_lang"] = tgt_lang
        if src_lang is None and tgt_lang is None:
            # Backward compatibility: the direction may be encoded in the task name, e.g. "translation_en_to_fr".
            task = kwargs.get("task", self.task)
            items = task.split("_")
            if task and len(items) == 4:
                # ["translation", "XX", "to", "YY"]
                preprocess_params["src_lang"] = items[1]
                preprocess_params["tgt_lang"] = items[3]
        return preprocess_params, forward_params, postprocess_params

    def __call__(self, *args, **kwargs):
        r"""
        Translate the text(s) given as inputs.

        Args:
            args (`str` or `list[str]`):
                Texts to be translated.
            return_tensors (`bool`, *optional*, defaults to `False`):
                Whether or not to include the tensors of predictions (as token indices) in the outputs.
            return_text (`bool`, *optional*, defaults to `True`):
                Whether or not to include the decoded texts in the outputs.
            clean_up_tokenization_spaces (`bool`, *optional*, defaults to `False`):
                Whether or not to clean up the potential extra spaces in the text output.
            src_lang (`str`, *optional*):
                The language of the input. Might be required for multilingual models. Will not have any effect for
                single pair translation models.
            tgt_lang (`str`, *optional*):
                The language of the desired output. Might be required for multilingual models. Will not have any effect
                for single pair translation models.
            generate_kwargs:
                Additional keyword arguments to pass along to the generate method of the model (see the generate method
                corresponding to your framework [here](./text_generation)).

        Return:
            A list or a list of list of `dict`: Each result comes as a dictionary with the following keys:

            - **translation_text** (`str`, present when `return_text=True`) -- The translation.
            - **translation_token_ids** (`torch.Tensor` or `tf.Tensor`, present when `return_tensors=True`) -- The
              token ids of the translation.
        """
        return super().__call__(*args, **kwargs)