
import subprocess
from typing import Any, Union

import numpy as np
import requests

from ..utils import (
    add_end_docstrings,
    is_torch_available,
    is_torchaudio_available,
    is_torchcodec_available,
    logging,
)
from .base import Pipeline, build_pipeline_init_args


if is_torch_available():
    from ..models.auto.modeling_auto import MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES

logger = logging.get_logger(__name__)


def ffmpeg_read(bpayload: bytes, sampling_rate: int) -> np.ndarray:
    """
    Helper function to read an audio file through ffmpeg.
    """
    ar = f"{sampling_rate}"
    ac = "1"
    format_for_conversion = "f32le"
    ffmpeg_command = [
        "ffmpeg",
        "-i",
        "pipe:0",
        "-ac",
        ac,
        "-ar",
        ar,
        "-f",
        format_for_conversion,
        "-hide_banner",
        "-loglevel",
        "quiet",
        "pipe:1",
    ]

    try:
        ffmpeg_process = subprocess.Popen(ffmpeg_command, stdin=subprocess.PIPE, stdout=subprocess.PIPE)
    except FileNotFoundError:
        raise ValueError("ffmpeg was not found but is required to load audio files from filename")
    output_stream = ffmpeg_process.communicate(bpayload)
    out_bytes = output_stream[0]

    # ffmpeg emits mono float32 PCM at the requested rate; an empty buffer means decoding failed.
    audio = np.frombuffer(out_bytes, np.float32)
    if audio.shape[0] == 0:
        raise ValueError("Malformed soundfile")
    return audio

XbXgXgh #..x8Ma IMM)RZZ0E{{1~.//L  cabbcs   2B% %B;T)has_feature_extractorc            	          ^  \ rS rSrSrSrSrSrSrU 4S jr	S\
\R                  \\\4   S\S\\\\4      4U 4S	 jjrSS
 jrS rS rSS jrSrU =r$ )AudioClassificationPipelineB   a  
    Audio classification pipeline using any `AutoModelForAudioClassification`. This pipeline predicts the class of a
    raw waveform or an audio file. In case of an audio file, ffmpeg should be installed to support multiple audio
    formats.

    Example:

    ```python
    >>> from transformers import pipeline

    >>> classifier = pipeline(model="superb/wav2vec2-base-superb-ks")
    >>> classifier("https://huggingface.co/datasets/Narsil/asr_dummy/resolve/main/1.flac")
    [{'score': 0.997, 'label': '_unknown_'}, {'score': 0.002, 'label': 'left'}, {'score': 0.0, 'label': 'yes'}, {'score': 0.0, 'label': 'down'}, {'score': 0.0, 'label': 'stop'}]
    ```

    Learn more about the basics of using a pipeline in the [pipeline tutorial](../pipeline_tutorial).

    This pipeline can currently be loaded from [`pipeline`] using the following task identifier:
    `"audio-classification"`.

    See the list of available models on
    [huggingface.co/models](https://huggingface.co/models?filter=audio-classification).
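
    The pipeline also accepts the `dict` input form described in [`AudioClassificationPipeline.__call__`]. A small
    sketch (synthetic silence, so the scores are not meaningful):

    ```python
    >>> import numpy as np

    >>> classifier({"sampling_rate": 16000, "raw": np.zeros((16000,), dtype=np.float32)})  # doctest: +SKIP
    ```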
    """

    _load_processor = False
    _load_image_processor = False
    _load_feature_extractor = True
    _load_tokenizer = False

    def __init__(self, *args, **kwargs):
        # Keep an explicitly passed `top_k=None` (meaning "return all labels"); otherwise
        # default to the top 5 labels.
        if "top_k" in kwargs and kwargs["top_k"] is None:
            kwargs["top_k"] = None
        elif "top_k" not in kwargs:
            kwargs["top_k"] = 5
        super().__init__(*args, **kwargs)

        if self.framework != "pt":
            raise ValueError(f"The {self.__class__} is only available in PyTorch.")

        self.check_model_type(MODEL_FOR_AUDIO_CLASSIFICATION_MAPPING_NAMES)
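
    # A sketch of the call-time knobs handled by `_sanitize_parameters` below (assumes a
    # constructed `classifier` instance and some `audio` input):
    #
    #     classifier(audio)                            # top 5 labels, softmax scores
    #     classifier(audio, top_k=None)                # scores for every label
    #     classifier(audio, function_to_apply="none")  # raw logits, no normalization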
    def __call__(self, inputs: Union[np.ndarray, bytes, str, dict], **kwargs: Any) -> list[dict[str, Any]]:
        """
        Classify the sequence(s) given as inputs. See the [`AutomaticSpeechRecognitionPipeline`] documentation for more
        information.

        Args:
            inputs (`np.ndarray` or `bytes` or `str` or `dict`):
                The inputs are either:
                    - `str`, the filename of the audio file; the file will be read at the correct sampling rate to get
                      the waveform using *ffmpeg*. This requires *ffmpeg* to be installed on the system.
                    - `bytes`, the content of an audio file, interpreted by *ffmpeg* in the same way.
                    - (`np.ndarray` of shape (n,) of type `np.float32` or `np.float64`)
                      Raw audio at the correct sampling rate (no further check will be done).
                    - `dict` form can be used to pass raw audio sampled at an arbitrary `sampling_rate` and let this
                      pipeline do the resampling. The dict must be in either the format `{"sampling_rate": int,
                      "raw": np.array}` or `{"sampling_rate": int, "array": np.array}`, where the key `"raw"` or
                      `"array"` is used to denote the raw audio waveform.
            top_k (`int`, *optional*, defaults to None):
                The number of top labels that will be returned by the pipeline. If the provided number is `None` or
                higher than the number of labels available in the model configuration, it will default to the number
                of labels.
            function_to_apply (`str`, *optional*, defaults to "softmax"):
                The function to apply to the model output. By default, the pipeline will apply the softmax function to
                the output of the model. Valid options: ["softmax", "sigmoid", "none"]. Note that passing Python's
                built-in `None` will default to "softmax", so you need to pass the string "none" to disable any
                post-processing.

        Return:
            A list of `dict` with the following keys:

            - **label** (`str`) -- The label predicted.
            - **score** (`float`) -- The corresponding probability.
        """
        return super().__call__(inputs, **kwargs)

    def _sanitize_parameters(self, top_k=None, function_to_apply=None, **kwargs):
        postprocess_params = {}
        if top_k is None:
            postprocess_params["top_k"] = self.model.config.num_labels
        else:
            # Clamp `top_k` to the number of labels the model actually has.
            if top_k > self.model.config.num_labels:
                top_k = self.model.config.num_labels
            postprocess_params["top_k"] = top_k
        if function_to_apply is not None:
            if function_to_apply not in ["softmax", "sigmoid", "none"]:
                raise ValueError(
                    f"Invalid value for `function_to_apply`: {function_to_apply}. "
                    "Valid options are ['softmax', 'sigmoid', 'none']"
                )
            postprocess_params["function_to_apply"] = function_to_apply
        else:
            postprocess_params["function_to_apply"] = "softmax"
        return {}, {}, postprocess_params

    def preprocess(self, inputs):
        if isinstance(inputs, str):
            if inputs.startswith("http://") or inputs.startswith("https://"):
                # We need to check for a real protocol, otherwise it's impossible to use a local file
                # like `http_huggingface_co.png`.
                inputs = requests.get(inputs).content
            else:
                with open(inputs, "rb") as f:
                    inputs = f.read()

        if isinstance(inputs, bytes):
            inputs = ffmpeg_read(inputs, self.feature_extractor.sampling_rate)

        if is_torch_available():
            import torch

            if isinstance(inputs, torch.Tensor):
                inputs = inputs.cpu().numpy()

        if is_torchcodec_available():
            import torchcodec

            if isinstance(inputs, torchcodec.decoders.AudioDecoder):
                _audio_samples = inputs.get_all_samples()
                inputs = {"array": _audio_samples.data, "sampling_rate": _audio_samples.sample_rate}

        if isinstance(inputs, dict):
            inputs = inputs.copy()  # So we don't mutate the original dictionary outside the pipeline
            # Accepting `"array"` as well, since that is the key `datasets` uses for raw audio.
            if not ("sampling_rate" in inputs and ("raw" in inputs or "array" in inputs)):
                raise ValueError(
                    "When passing a dictionary to AudioClassificationPipeline, the dict needs to contain a "
                    '"raw" key containing the numpy array or torch tensor representing the audio and a '
                    '"sampling_rate" key, containing the sampling_rate associated with that array'
                )

            _inputs = inputs.pop("raw", None)
            if _inputs is None:
                # Remove `path`, which comes from `datasets` but is not used here.
                inputs.pop("path", None)
                _inputs = inputs.pop("array", None)
            in_sampling_rate = inputs.pop("sampling_rate")
            inputs = _inputs
            if in_sampling_rate != self.feature_extractor.sampling_rate:
                import torch

                if is_torchaudio_available():
                    from torchaudio import functional as F
                else:
                    raise ImportError(
                        "torchaudio is required to resample audio samples in AudioClassificationPipeline. "
                        "The torchaudio package can be installed through: `pip install torchaudio`."
                    )

                inputs = F.resample(
                    torch.from_numpy(inputs) if isinstance(inputs, np.ndarray) else inputs,
                    in_sampling_rate,
                    self.feature_extractor.sampling_rate,
                ).numpy()

        if not isinstance(inputs, np.ndarray):
            raise TypeError("We expect a numpy ndarray or torch tensor as input")
        if len(inputs.shape) != 1:
            raise ValueError("We expect a single channel audio input for AudioClassificationPipeline")

        processed = self.feature_extractor(
            inputs, sampling_rate=self.feature_extractor.sampling_rate, return_tensors="pt"
        )
        if self.torch_dtype is not None:
            processed = processed.to(dtype=self.torch_dtype)
        return processed

    def _forward(self, model_inputs):
        model_outputs = self.model(**model_inputs)
        return model_outputs

    def postprocess(self, model_outputs, top_k=5, function_to_apply="softmax"):
        if function_to_apply == "softmax":
            probs = model_outputs.logits[0].softmax(-1)
        elif function_to_apply == "sigmoid":
            probs = model_outputs.logits[0].sigmoid()
        else:
            probs = model_outputs.logits[0]
        scores, ids = probs.topk(top_k)

        scores = scores.tolist()
        ids = ids.tolist()

        labels = [{"score": score, "label": self.model.config.id2label[_id]} for score, _id in zip(scores, ids)]

        return labels