
    Pi	                         d dl mZ i dddddddd	d
dddddddddddddddddddddd d!d"d#d$d%d&d'Zh d(Zd) Zd*S )+    )get_mapped_keyz,text_model.embeddings.token_embedding.weightztoken_embedding.weightz/text_model.embeddings.position_embedding.weightposition_embeddingz/text_model.encoder.layers.{}.layer_norm1.weightzlayers.{}.sa_norm.weightz-text_model.encoder.layers.{}.layer_norm1.biaszlayers.{}.sa_norm.biasz/text_model.encoder.layers.{}.layer_norm2.weightzlayers.{}.mlp_norm.weightz-text_model.encoder.layers.{}.layer_norm2.biaszlayers.{}.mlp_norm.biasz+text_model.encoder.layers.{}.mlp.fc1.weightzlayers.{}.mlp.w1.weightz)text_model.encoder.layers.{}.mlp.fc1.biaszlayers.{}.mlp.w1.biasz+text_model.encoder.layers.{}.mlp.fc2.weightzlayers.{}.mlp.w2.weightz)text_model.encoder.layers.{}.mlp.fc2.biaszlayers.{}.mlp.w2.biasz4text_model.encoder.layers.{}.self_attn.q_proj.weightzlayers.{}.attn.q_proj.weightz2text_model.encoder.layers.{}.self_attn.q_proj.biaszlayers.{}.attn.q_proj.biasz4text_model.encoder.layers.{}.self_attn.k_proj.weightzlayers.{}.attn.k_proj.weightz2text_model.encoder.layers.{}.self_attn.k_proj.biaszlayers.{}.attn.k_proj.biasz4text_model.encoder.layers.{}.self_attn.v_proj.weightzlayers.{}.attn.v_proj.weightz2text_model.encoder.layers.{}.self_attn.v_proj.biaszlayers.{}.attn.v_proj.biasz4text_model.encoder.layers.{}.self_attn.out_proj.biaszlayers.{}.attn.output_proj.biasz!layers.{}.attn.output_proj.weightzfinal_norm.weightzfinal_norm.bias)z6text_model.encoder.layers.{}.self_attn.out_proj.weightz"text_model.final_layer_norm.weightz text_model.final_layer_norm.bias>   text_projection.weightvisual_projection.weight"text_model.embeddings.position_idslogit_scalec                     i }|                                  D ]>\  }}|                    d          s	|t          v r$t          |t                    }|||<   ?|S )Nzvision_model.)items
startswith_IGNOREr   _FROM_HF)
state_dictconverted_state_dictkeyvaluenew_keys        z/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/torchtune/models/clip/_convert_weights.pyclip_text_hf_to_tuner   )   si     &&(( . .
U>>/** 	cWnn h//(-W%%    N) torchtune.models.convert_weightsr   r   r   r    r   r   <module>r      s>   < ; ; ; ; ;24L57K 67Q 45M	
 67R 45N 23L 01H 23L 01H ;<Z 9:V ;<Z 9:V ;<Z  9:V!" ;<]#$ ?b*=(9)  .           r   