
    .`iv                     r    d dl mZ d dlmZ  G d de          Z G d de          Z G d de          Zd	S )
    )Any)PretrainedConfigc                   8     e Zd ZdZ	 	 	 	 	 	 	 	 	 	 d fd	Z xZS )Step3VisionEncoderConfigstep3_vision_encoder         ?              
quick_geluh㈵>c                     || _         || _        || _        || _        || _        || _        || _        || _        |
| _        |	| _	         t                      j        di | d S N )hidden_sizeintermediate_sizeoutput_hidden_sizenum_hidden_layersnum_attention_headsnum_channels
patch_size
image_sizelayer_norm_eps
hidden_actsuper__init__)selfr   r   r   r   r   r   r   r   r   r   kwargs	__class__s               |/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/vllm/transformers_utils/configs/step3_vl.pyr    z!Step3VisionEncoderConfig.__init__   su     '!2"4!2#6 ($$,$""6"""""    )
r   r	   r
   r   r   r   r   r   r   r   )__name__
__module____qualname__
model_typer    __classcell__r#   s   @r$   r   r      sb        'J # # # # # # # # # #r%   r   c            '            e Zd ZdZdgZ	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 d(dedededededededededededeee	f         dz  ded ed!ed"ed#e
d$eed%f         d&df& fd'Z xZS ))Step3TextConfig
step3_textStep3TextForCausalLM    H  @      =      / r      0   r   N      F8               	   
            r      r                                                    !   "   #   $   %   &   '   (   )   *   +   ,   -   .   /   r8   1   2   3   4   5   6   7   8   9   :   ;   r   r   r   num_attention_groupsr   max_seq_len
vocab_sizerms_norm_epsmoe_intermediate_sizemoe_num_experts	moe_top_krope_parametersmax_position_embeddingshare_expert_dimshare_q_dimhead_dimnorm_expert_weightmoe_layers_enum.returnc                    || _         || _        || _        || _        || _        || _        || _        || _        |	| _        |
| _	        || _
        |                    dd           }|p|pddi}|                    dd          }d|vr||d<   || _        || _        || _        || _        || _        || _        || _         t'                      j        di | d S )Nrope_scaling	rope_typedefault
rope_thetag    Ar   )r   r   r   rq   r   rr   rs   rt   ru   rv   rw   poprx   ry   rz   r{   r|   r}   r~   r   r    )r!   r   r   r   rq   r   rr   rs   rt   ru   rv   rw   rx   ry   rz   r{   r|   r}   r~   r"   r   r   r#   s                         r$   r    zStep3TextConfig.__init__*   s   ^ '!2#6 $8!!2&$(%:"."zz.$77&U/Uk9=UZZh77
..,6OL).&<# 0& "4.""6"""""r%   )r0   r1   r2   r3   r4   r5   r6   r   r7   r8   r   Nr5   r7   r9   r:   Fr;   )r&   r'   r(   r)   architecturesintfloatdictstrr   booltupler    r*   r+   s   @r$   r-   r-   &   sz       J+,M  !&#%$%!#  "%)!15&+ $#(9,
'h# h#h# h# !	h#
 "h# h# h# h# h#  #h# h# h# c3h$.h# !$h# h#  !h#" #h#$ !%h#& sCx'h#\ 
]h# h# h# h# h# h# h# h# h# h#r%   r-   c                   `     e Zd ZdZ	 	 	 	 	 ddeez  dz  deez  dz  ded	ed
eddf fdZ	 xZ
S )Step3VLConfigstep3_vlNr3   T vision_configtext_configunderstand_projector_strideprojector_biasimage_token_idr   c                 `   |t                      }n!t          |t                    rt          di |}|| _        |t	                      }n!t          |t                    rt	          di |}|| _        || _        || _        |j        | _        || _	         t                      j        di | d S r   )r   
isinstancer   r   r-   r   r   r   r   r   r   r    )r!   r   r   r   r   r   r"   r#   s          r$   r    zStep3VLConfig.__init__   s      466MMt,, 	F4EE}EEM*)++KKT** 	9)88K88K&+F(,&2,""6"""""r%   )NNr3   Tr   )r&   r'   r(   r)   r   r   r-   r   r   r    r*   r+   s   @r$   r   r      s        J AE59+,#$# #66=# O+d2# &)	#
 # # 
# # # # # # # # # #r%   r   N)typingr    transformers.configuration_utilsr   r   r-   r   r   r%   r$   <module>r      s          = = = = = =# # # # #/ # # #<l# l# l# l# l#& l# l# l#^# # # # #$ # # # # #r%   