§
    .`ƒiP  ã                   ó@   — d dl mZ d dlZ G d„ dej        ¦  «        ZdS )é    )ÚAnyNc                   óø   ‡ — e Zd ZU dZej        ed<   dZdZdZ		 	 	 	 	 	 	 	 	 	 	 	 dde
eef         dz  de
eef         dz  dedz  dedz  dedededededededefˆ fd„Zˆ fd„Zedej        fd„¦   «         Zˆ xZS )ÚUltravoxConfigaµ  
    This is the configuration class to store the configuration of a
    [`UltravoxForConditionalGeneration`]. It is used to instantiate an
    Ultravox model according to the specified arguments, defining the model
    architecture.

    Configuration objects inherit from [`PretrainedConfig`] and can be used to
    control the model outputs. Read the documentation from [`PretrainedConfig`]
    for more information.

    Args:
        audio_config (`Union[AutoConfig, dict]`,  *optional*):
            Custom audio config or dict.
        text_config (`Union[AutoConfig, dict]`, *optional*):
            The config object of the text backbone.
        audio_model_id (`str`, *optional*):
            The model ID of the audio backbone.
        text_model_id (`str`, *optional*):
            The model ID of the text backbone.
        ignore_index (`int`, *optional*, defaults to -100):
            The ignore index for the loss function.
        audio_token_index (`int`, *optional*, defaults to 32000):
            The audio token index to encode the audio prompt.
        stack_factor (`int`, *optional*, defaults to 8):
            Audio downsampling factor for the multimodal projector.
        norm_init (`float`, *optional*, defaults to 0.4):
            The initialization value for the layer normalization.
        projector_act (`str`, *optional*, defaults to `"swiglu"`):
            The activation function used by the multimodal projector.
        projector_ln_mid (`bool`, *optional*, defaults to `False`):
            Whether to apply layer normalization at the middle of the
            projector or at the end. Versions v0.4.1 and below
            use `False`, but v0.5 and above use `True`.
    Úwrapped_model_configÚultravoxz	<|audio|>FNéœÿÿÿé }  é   é   çš™™™™™Ù?Úswiglur   Úaudio_configÚtext_configÚaudio_model_idÚtext_model_idÚignore_indexÚaudio_token_indexÚhidden_sizeÚstack_factorÚ	norm_initÚprojector_actÚprojector_ln_midÚnum_projector_layersc                 ó¬  •— || _         || _        || _        || _        |	| _        |
| _        || _        || _        || _        |€4|pi }t          j
        |                     dd¦  «                 di |¤Ž| _        || _        |€;d | _        |pi }t          j
        |                     dd¦  «                 di |¤Ž| _         t          ¦   «         j        di |¤Ž d S )NÚ
model_typeÚllamaÚwhisper© )r   r   r   r   r   r   r   r   r   ÚtransformersÚCONFIG_MAPPINGÚgetr   r   r   ÚsuperÚ__init__)Úselfr   r   r   r   r   r   r   r   r   r   r   r   ÚkwargsÚ	__class__s                 €ú|/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/vllm/transformers_utils/configs/ultravox.pyr#   zUltravoxConfig.__init__3   s  ø€ ð  )ˆÔØ!2ˆÔà&ˆÔØ(ˆÔØ"ˆŒØ*ˆÔØ 0ˆÔØ$8ˆÔ!ð +ˆÔØÐ Ø%Ð+¨ˆKÝ(4Ô(CØ—’ ¨gÑ6Ô6ô)ð )ð )àð)ð )ˆDÔ%ð
 -ˆÔØÐ!Ø"&ˆDÔØ'Ð-¨2ˆLÝ ,Ô ;Ø× Ò  ¨yÑ9Ô9ô!ð !ð !àð!ð !ˆDÔð 	‰ŒÔÐ"Ð"˜6Ð"Ð"Ð"Ð"Ð"ó    c                 óÊ   •— |dk    r|ddl m}  ||d¬¦  «        | _        n |dk    r|ddl m}  ||d¬¦  «        | _        t	          ¦   «                              ||¦  «        S )Nr   r   )Ú
get_configF)Útrust_remote_coder   )Úvllm.transformers_utils.configr*   r   r   r"   Ú__setattr__)r$   ÚkeyÚvaluer*   r&   s       €r'   r-   zUltravoxConfig.__setattr__`   s•   ø€ ð /Ò!Ð! eÐ&7ØAÐAÐAÐAÐAÐAà(2¨
°5ÈEÐ(RÑ(RÔ(RˆDÔ%Ð%ØÐ$Ò$Ð$¨Ð):ØAÐAÐAÐAÐAÐAà * 
¨5ÀEÐ JÑ JÔ JˆDÔå‰wŒw×"Ò" 3¨Ñ.Ô.Ð.r(   Úreturnc                 ó4   — | j                              ¦   «         S )N)r   Úget_text_config)r$   s    r'   r   zUltravoxConfig.text_configs   s   € ð
 Ô(×8Ò8Ñ:Ô:Ð:r(   )NNNNr   r	   r
   r   r   r   Fr   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   ÚPretrainedConfigÚ__annotations__r   Úaudio_tokenÚis_compositionÚdictÚstrr   ÚintÚfloatÚboolr#   r-   Úpropertyr   Ú__classcell__)r&   s   @r'   r   r   
   sq  ø€ € € € € € ð!ð !ðF 'Ô7Ð7Ð7Ñ7Ø€JØ€KØ€Nð /3Ø-1Ø%)Ø$(Ø Ø!&ØØØØ%Ø!&Ø$%ð+#ð +#à˜3 ˜8”n tÑ+ð+#ð ˜#˜s˜(”^ dÑ*ð+#ð ˜d™
ð	+#ð
 ˜T‘zð+#ð ð+#ð ð+#ð ð+#ð ð+#ð ð+#ð ð+#ð ð+#ð "ð+#ð +#ð +#ð +#ð +#ð +#ðZ/ð /ð /ð /ð /ð& ð;˜\Ô:ð ;ð ;ð ;ñ „Xð;ð ;ð ;ð ;ð ;r(   r   )Útypingr   r   r7   r   r   r(   r'   ú<module>rC      sf   ðð
 Ð Ð Ð Ð Ð à Ð Ð Ð ðn;ð n;ð n;ð n;ð n;\Ô2ñ n;ô n;ð n;ð n;ð n;r(   