o
    0j                     @   s   d dl mZmZmZmZmZ d dlZddlm	Z	 ddl
mZmZ ddlmZ ddlmZ d	d
lmZ eje	dG dd deZdS )    )AnyDictListOptionalUnionN   )pipeline_requires_extra   )	HPIConfigPaddlePredictorOption)WhisperResult)	benchmark   )BasePipelineZspeechc                       s   e Zd ZdZdZddddddddedee dee d	eeeef  d
ee	 de
deeeeef ef  ddf fddZdeeee ejeej f defddZ  ZS )%MultilingualSpeechRecognitionPipelinez(Multilingual Speech Recognition PipelineZmultilingual_speech_recognitionNFdeviceengineengine_config	pp_optionuse_hpip
hpi_configconfigr   r   r   r   r   r   returnc          
   	      sD   t  jd||||||d| |d d }	| |	| _|	d  dS )a)  Initializes the multilingual speech recognition pipeline.

        Args:
            config (Dict): Configuration dictionary containing model and other parameters.
            device (Optional[str], optional): The device to use for prediction. Defaults to `None`.
            engine (Optional[str], optional): Inference engine. Defaults to `None`.
            engine_config (Optional[Dict[str, Any]], optional): Engine-specific config. Defaults to `None`.
            pp_option (Optional[PaddlePredictorOption], optional): Paddle predictor options.
                Defaults to `None`.
            use_hpip (bool, optional): Whether to use HPIP. Defaults to `False`.
            hpi_config (Optional[Union[Dict[str, Any], HPIConfig]], optional):
                HPIP configuration. Defaults to `None`.
        r   Z
SubModulesZMultilingualSpeechRecognitionZ
batch_sizeN )super__init__Zcreate_model%multilingual_speech_recognition_model)
selfr   r   r   r   r   r   r   kwargsZ,multilingual_speech_recognition_model_config	__class__r   /var/www/html/Deteccion_Ine/venv/lib/python3.10/site-packages/paddlex/inference/pipelines/multilingual_speech_recognition/pipeline.pyr   !   s"   
z.MultilingualSpeechRecognitionPipeline.__init__inputc                 k   s    |  |E dH  dS )ar  Predicts speech recognition results for the given input.

        Args:
            input (Union[str, list[str], np.ndarray, list[np.ndarray]]): The input audio or path.
            **kwargs: Additional keyword arguments that can be passed to the function.

        Returns:
            WhisperResult: The predicted whisper results, support str and json output.
        N)r   )r   r#   r   r   r   r"   predictM   s   z-MultilingualSpeechRecognitionPipeline.predict)__name__
__module____qualname____doc__entitiesr   r   strr   r   boolr   r
   r   r   npZndarrayr   r$   __classcell__r   r   r    r"   r      s>    	,r   )typingr   r   r   r   r   numpyr,   Z
utils.depsr   modelsr
   r   Z-models.multilingual_speech_recognition.resultr   Zutils.benchmarkr   baser   Ztime_methodsr   r   r   r   r"   <module>   s   