
    .`i)                     j    d dl mZmZ  G d de          Z G d de          Z G d de          ZdS )	    )DeepseekV2ConfigPretrainedConfigc                   L    e Zd ZU dZeed<   dZeed<   dZeed<   dZ	eed<   d	Z
eed
<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   dZeed<   	 	 	 	 	 	 	 	 	 	 	 	 ddededed
ededededededededef fdZ xZS )VisionEncoderConfigvision
model_type#vit_so400m_patch14_siglip_384.webli
model_name  
image_size   
patch_size   width   layersheads   	mlp_ratiomapglobal_poolTignore_headFclass_tokenr   num_classesuse_checkpointskipweight_initdeterministicnum_recomputing_layersc                     || _         || _        || _        || _        || _        || _        || _        || _        |	| _        |
| _	        || _
        || _         t                      j        di | d S N )r
   r   r   r   r   r   r   r   r   r   r   r   super__init__)selfr
   r   r   r   r   r   r   r   r   r   r   r   kwargs	__class__s                 /home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/vllm/transformers_utils/configs/deepseek_vl2.pyr$   zVisionEncoderConfig.__init__   s      %$$

"&&&&,""6"""""    )r	   r   r   r   r   r   r   r   TFr   F)__name__
__module____qualname__r   str__annotations__r
   r   intr   r   r   r   r   r   r   boolr   r   r   r   r   r   r$   __classcell__r'   s   @r(   r   r   	   s        J;J;;;JJE3FCE3OOOIsKKKK ND   KM4"#C### @  !$# ## # 	#
 # # # # # # # # # # # # # # # # # #r)   r   c                        e Zd ZU dZdZeed<   dZeed<   dZ	eed<   dZ
eed	<   d
Zeed<   dZeed<   dZeed<   	 	 	 	 	 	 ddededed	ededef fdZ xZS )MlpProjectorConfigmlp_projectordownsample_mlp_geluprojector_type  	input_dim   n_embed   depth   r   downsample_ratioFtoken_poolingc                     || _         || _        || _        || _        || _        || _         t                      j        di | d S r!   )r7   r9   r;   r=   r   r?   r#   r$   )	r%   r7   r9   r;   r=   r   r?   r&   r'   s	           r(   r$   zMlpProjectorConfig.__init__F   sT     -"
" 0""6"""""r)   )r6   r8   r:   r<   r>   r<   )r*   r+   r,   r   r7   r-   r.   r9   r/   r;   r=   r   r?   r@   r0   r$   r1   r2   s   @r(   r4   r4   <   s         J/NC///IsGSE3NNNIscM4 4 !# ## # 	#
 # # # # # # # # # # # #r)   r4   c            
            e Zd ZU dZeed<   eed<   dZeed<   dZ	eed<   dZ
eeeef                  ed	<   	 	 	 ddeded	eeeef                  f fd
Z xZS )DeepseekVLV2Configdeepseek_vl_v2vision_configprojector_config2Dtile_tagheadglobal_view_pos)r   r   candidate_resolutionsc                     t                      j        di | |                    di           }t          di || _        |                    di           }t          di || _        |                    di           }t          di || _        || _	        || _
        || _        | j        j        | _        d| j        p|                    dg           v r	d| _        d S d S )NrE   rF   language_configDeepseekOCRForCausalLMarchitecturesdeepseek_ocrr"   )r#   r$   getr   rE   r4   rF   r   text_configrH   rJ   rL   
vocab_sizerP   r   )	r%   rH   rJ   rL   r&   rE   rF   rN   r'   s	           r(   r$   zDeepseekVLV2Config.__init__c   s    	""6"""

?B770AA=AA!::&8"== 2 F F5E F F **%6;;+>>o>> .%:"*5 $A&**_b"A"A
 
 -DOOO
 
r)   )rH   rI   rK   )r*   r+   r,   r   r   r.   r4   rH   r-   rJ   rL   tupler/   r$   r1   r2   s   @r(   rC   rC   Z   s         !J&&&&((((Hc!OS!!!4A5sCx1AAA #%8E	- -- -  %U38_5	- - - - - - - - - -r)   rC   N)transformersr   r   r   r4   rC   r"   r)   r(   <module>rW      s    < ; ; ; ; ; ; ;0# 0# 0# 0# 0#* 0# 0# 0#f# # # # #) # # #<$- $- $- $- $-) $- $- $- $- $-r)   