
     `iT                        d Z ddlmZmZ ddlZddlmZmZ ddl	m
Z
mZmZ ddlmZmZ ddlmZmZmZmZmZmZmZmZmZmZmZmZ dd	lmZmZm Z   e            rddl!Z! e            rddl"Z"dd
l"m#Z#m$Z$ ddl%m&Z&  ej'        e(          Z)	 ddej*        deee+ef                  fdZ,	 ddedeee+ef                  defdZ-defdZ. G d de
          Z/dgZ0dS )z%Image processor class for SuperPoint.    )OptionalUnionN   )is_torch_availableis_vision_available)BaseImageProcessorBatchFeatureget_size_dict)resizeto_channel_dimension_format)ChannelDimension
ImageInput	ImageTypePILImageResamplingget_image_typeinfer_channel_dimension_formatis_pil_imageis_scaled_imageis_valid_imageto_numpy_arrayvalid_imagesvalidate_preprocess_arguments)
TensorTypeloggingrequires_backends)Image	ImageDraw   )KeypointMatchingOutputimageinput_data_formatc                    |t           j        k    r[| j        d         dk    rdS t          j        | d         | d         k              o#t          j        | d         | d         k              S |t           j        k    r[| j        d         dk    rdS t          j        | d         | d	         k              o#t          j        | d	         | d
         k              S d S )Nr   r   Tr   .r   .   ..r   .r   .r&   )r   FIRSTshapenpallLAST)r    r!   s     /home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/transformers/models/efficientloftr/image_processing_efficientloftr.pyis_grayscaler1   5   s     ,222;q>Q4veFmuV}455`"&vRWX^R_A_:`:``	.3	3	3;r?a4veFmuV}455`"&vRWX^R_A_:`:`` 
4	3    returnc                 2   t          t          dg           t          | t          j                  rt          | |          r| S |t          j        k    r>| d         dz  | d         dz  z   | d         dz  z   }t          j        |gd	z  d
          }nM|t          j	        k    r=| d         dz  | d         dz  z   | d         dz  z   }t          j        |gd	z  d          }|S t          | t          j        j                  s| S |                     d          } | S )ao  
    Converts an image to grayscale format using the NTSC formula. Only support numpy and PIL Image. TODO support torch
    and tensorflow grayscale conversion

    This function is supposed to return a 1-channel image, but it returns a 3-channel image with the same value in each
    channel, because of an issue that is discussed in :
    https://github.com/huggingface/transformers/pull/25786#issuecomment-1730176446

    Args:
        image (Image):
            The image to convert.
        input_data_format (`ChannelDimension` or `str`, *optional*):
            The channel dimension format for the input image.
    visionr!   r#   gŏ1w-!?r$   gbX9?r%   gv/?r   r   )axisr(   r)   r*   r'   L)r   convert_to_grayscale
isinstancer-   ndarrayr1   r   r+   stackr/   PILr   convert)r    r!   
gray_images      r0   r9   r9   D   s+   $ *XJ777%$$ 	1BCCC 	L 0 666v/%-&2HH5QW=[aKaaJ:,"2;;;JJ"2"777v/%-&2HH5QW=[aKaaJ:,"2<<<JeSY_-- MM#ELr2   imagesc                    d}d t          | t                    rWt          |           dk    rt          fd| D                       r| S t          fd| D                       rd | D             S t	          |          )N)z-Input images must be a one of the following :z - A pair of PIL images.z - A pair of 3D arrays.z! - A list of pairs of PIL images.z  - A list of pairs of 3D arrays.c                     t          |           pCt          |           o4t          |           t          j        k    ot          | j                  dk    S )z$images is a PIL Image or a 3D array.r   )r   r   r   r   r=   lenr,   )r    s    r0   _is_valid_imagez8validate_and_format_image_pairs.<locals>._is_valid_imaget   sN    E"" 
5!!fnU&;&;y}&LfQTUZU`QaQaefQf	
r2   r&   c              3   .   K   | ]} |          V  d S N .0r    rD   s     r0   	<genexpr>z2validate_and_format_image_pairs.<locals>.<genexpr>{   s-      #Q#Q__U%;%;#Q#Q#Q#Q#Q#Qr2   c              3      K   | ]G}t          |t                    o-t          |          d k    ot          fd|D                       V  HdS )r&   c              3   .   K   | ]} |          V  d S rF   rG   rH   s     r0   rJ   z<validate_and_format_image_pairs.<locals>.<genexpr>.<genexpr>   s-      CCuOOE**CCCCCCr2   N)r:   listrC   r.   )rI   
image_pairrD   s     r0   rJ   z2validate_and_format_image_pairs.<locals>.<genexpr>}   s}       
 
  z4(( DJ1$DCCCC
CCCCC
 
 
 
 
 
r2   c                     g | ]	}|D ]}|
S rG   rG   )rI   rN   r    s      r0   
<listcomp>z3validate_and_format_image_pairs.<locals>.<listcomp>   s%    KKKj
KKuEKKKKr2   )r:   rM   rC   r.   
ValueError)r@   error_messagerD   s     @r0   validate_and_format_image_pairsrS   k   s    M
 
 
 &$ 	Lv;;!#Q#Q#Q#Q&#Q#Q#Q Q QM 
 
 
 
 %	
 
 
 
 
 	L LKFKKKK
]
#
##r2   c                   r    e Zd ZdZdgZddej        dddfdedee	e
ef                  ded	ed
ededdf fdZ	 	 ddej        de	e
ef         deee
ef                  deee
ef                  fdZdddddddej        df	dee         dee	e
ef                  dee         d	ee         d
ee         dee         deee
ef                  dedeee
ef                  defdZ	 d dddeeee         f         dedee	e
ej        f                  fdZdedee	e
ej        f                  ded         fdZd Z xZS )!EfficientLoFTRImageProcessorau  
    Constructs a EfficientLoFTR image processor.

    Args:
        do_resize (`bool`, *optional*, defaults to `True`):
            Controls whether to resize the image's (height, width) dimensions to the specified `size`. Can be overridden
            by `do_resize` in the `preprocess` method.
        size (`Dict[str, int]` *optional*, defaults to `{"height": 480, "width": 640}`):
            Resolution of the output image after `resize` is applied. Only has an effect if `do_resize` is set to
            `True`. Can be overridden by `size` in the `preprocess` method.
        resample (`PILImageResampling`, *optional*, defaults to `Resampling.BILINEAR`):
            Resampling filter to use if resizing the image. Can be overridden by `resample` in the `preprocess` method.
        do_rescale (`bool`, *optional*, defaults to `True`):
            Whether to rescale the image by the specified scale `rescale_factor`. Can be overridden by `do_rescale` in
            the `preprocess` method.
        rescale_factor (`int` or `float`, *optional*, defaults to `1/255`):
            Scale factor to use if rescaling the image. Can be overridden by `rescale_factor` in the `preprocess`
            method.
        do_grayscale (`bool`, *optional*, defaults to `True`):
            Whether to convert the image to grayscale. Can be overridden by `do_grayscale` in the `preprocess` method.
    pixel_valuesTNgp?	do_resizesizeresample
do_rescalerescale_factordo_grayscaler3   c                      t                      j        di | ||nddd}t          |d          }|| _        || _        || _        || _        || _        || _        d S )Ni  i  )heightwidthFdefault_to_squarerG   )	super__init__r
   rW   rX   rY   rZ   r[   r\   )	selfrW   rX   rY   rZ   r[   r\   kwargs	__class__s	           r0   rc   z%EfficientLoFTRImageProcessor.__init__   s|     	""6"""'ttc-J-JTU;;;"	 $,(r2   r    data_formatr!   c                 b    t          |d          }t          |f|d         |d         f||d|S )aL  
        Resize an image.

        Args:
            image (`np.ndarray`):
                Image to resize.
            size (`dict[str, int]`):
                Dictionary of the form `{"height": int, "width": int}`, specifying the size of the output image.
            data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format of the output image. If not provided, it will be inferred from the input
                image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.
            input_data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format for the input image. If unset, the channel dimension format is inferred
                from the input image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.
        Fr`   r^   r_   )rX   rg   r!   )r
   r   )rd   r    rX   rg   r!   re   s         r0   r   z#EfficientLoFTRImageProcessor.resize   sU    : TU;;;
x.$w-0#/	
 

 
 
 	
r2   return_tensorsc                 >   ||n| j         }||n| j        }||n| j        }||n| j        }||n| j        }||n| j        }t          |d          }t          |          }t          |          st          d          t          |||||           d |D             }t          |d                   r|rt                              d           |
t          |d                   }
g |D ]q}|r|                     ||||
	          }|r|                     |||

          }|rt#          ||
          }t%          ||	|
          }                    |           rfdt)          dt+                    d          D             }d|i}t-          ||          S )a   
        Preprocess an image or batch of images.

        Args:
            images (`ImageInput`):
                Image pairs to preprocess. Expects either a list of 2 images or a list of list of 2 images list with
                pixel values ranging from 0 to 255. If passing in images with pixel values between 0 and 1, set
                `do_rescale=False`.
            do_resize (`bool`, *optional*, defaults to `self.do_resize`):
                Whether to resize the image.
            size (`dict[str, int]`, *optional*, defaults to `self.size`):
                Size of the output image after `resize` has been applied. If `size["shortest_edge"]` >= 384, the image
                is resized to `(size["shortest_edge"], size["shortest_edge"])`. Otherwise, the smaller edge of the
                image will be matched to `int(size["shortest_edge"]/ crop_pct)`, after which the image is cropped to
                `(size["shortest_edge"], size["shortest_edge"])`. Only has an effect if `do_resize` is set to `True`.
            resample (`PILImageResampling`, *optional*, defaults to `self.resample`):
                Resampling filter to use if resizing the image. This can be one of `PILImageResampling`, filters. Only
                has an effect if `do_resize` is set to `True`.
            do_rescale (`bool`, *optional*, defaults to `self.do_rescale`):
                Whether to rescale the image values between [0 - 1].
            rescale_factor (`float`, *optional*, defaults to `self.rescale_factor`):
                Rescale factor to rescale the image by if `do_rescale` is set to `True`.
            do_grayscale (`bool`, *optional*, defaults to `self.do_grayscale`):
                Whether to convert the image to grayscale.
            return_tensors (`str` or `TensorType`, *optional*):
                The type of tensors to return. Can be one of:
                    - Unset: Return a list of `np.ndarray`.
                    - `TensorType.TENSORFLOW` or `'tf'`: Return a batch of type `tf.Tensor`.
                    - `TensorType.PYTORCH` or `'pt'`: Return a batch of type `torch.Tensor`.
                    - `TensorType.NUMPY` or `'np'`: Return a batch of type `np.ndarray`.
                    - `TensorType.JAX` or `'jax'`: Return a batch of type `jax.numpy.ndarray`.
            data_format (`ChannelDimension` or `str`, *optional*, defaults to `ChannelDimension.FIRST`):
                The channel dimension format for the output image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - Unset: Use the channel dimension format of the input image.
            input_data_format (`ChannelDimension` or `str`, *optional*):
                The channel dimension format for the input image. If unset, the channel dimension format is inferred
                from the input image. Can be one of:
                - `"channels_first"` or `ChannelDimension.FIRST`: image in (num_channels, height, width) format.
                - `"channels_last"` or `ChannelDimension.LAST`: image in (height, width, num_channels) format.
                - `"none"` or `ChannelDimension.NONE`: image in (height, width) format.
        NFr`   zkInvalid image type. Must be of type PIL.Image.Image, numpy.ndarray, torch.Tensor, tf.Tensor or jax.ndarray.)rW   rX   rY   rZ   r[   c                 ,    g | ]}t          |          S rG   r   rI   r    s     r0   rP   z;EfficientLoFTRImageProcessor.preprocess.<locals>.<listcomp>3       <<<E.''<<<r2   r   zIt looks like you are trying to rescale already rescaled images. If the input images have pixel values between 0 and 1, set `do_rescale=False` to avoid rescaling them again.)r    rX   rY   r!   )r    scaler!   r6   )input_channel_dimc                 *    g | ]}||d z            S r&   rG   )rI   i
all_imagess     r0   rP   z;EfficientLoFTRImageProcessor.preprocess.<locals>.<listcomp>N  s&    SSSz!a!e),SSSr2   r&   rV   )datatensor_type)rW   rY   rZ   r[   r\   rX   r
   rS   r   rQ   r   r   loggerwarning_oncer   r   rescaler9   r   appendrangerC   r	   )rd   r@   rW   rX   rY   rZ   r[   r\   ri   rg   r!   re   r    image_pairsru   rt   s                  @r0   
preprocessz'EfficientLoFTRImageProcessor.preprocess   s,   t "+!6IIDN	'388#-#9ZZt
+9+E4K^'3'?||TEV'ttTYTU;;; 188F## 	:  
 	&!)	
 	
 	
 	
 =<V<<<6!9%% 	* 	s  
 $ >vay I I
 	% 	%E t%dXarss m5Zkll Y,UFWXXX/{VghhhEe$$$$ TSSSeAs:PQ6R6RSSS,>BBBBr2           outputsr   target_sizes	thresholdc                    |j         j        d         t          |          k    rt          d          t	          d |D                       st          d          t          |t                    r!t          j        ||j         j	                  }n3|j        d         dk    s|j        d         dk    rt          d          |}|j
                                        }||                    d                              dddd          z  }|                    t          j                  }g }t!          ||j         |j                  D ]x\  }}}	t          j        |	|k    |dk              }
|d         |
d                  }|d         |
d                  }|	d         |
d                  }|                    |||d	           y|S )
a  
        Converts the raw output of [`KeypointMatchingOutput`] into lists of keypoints, scores and descriptors
        with coordinates absolute to the original image sizes.
        Args:
            outputs ([`KeypointMatchingOutput`]):
                Raw outputs of the model.
            target_sizes (`torch.Tensor` or `List[Tuple[Tuple[int, int]]]`, *optional*):
                Tensor of shape `(batch_size, 2, 2)` or list of tuples of tuples (`Tuple[int, int]`) containing the
                target size `(height, width)` of each image in the batch. This must be the original image size (before
                any processing).
            threshold (`float`, *optional*, defaults to 0.0):
                Threshold to filter out the matches with low scores.
        Returns:
            `List[Dict]`: A list of dictionaries, each dictionary containing the keypoints in the first and second image
            of the pair, the matching scores and the matching indices.
        r   zRMake sure that you pass in as many target sizes as the batch dimension of the maskc              3   <   K   | ]}t          |          d k    V  dS )r&   N)rC   )rI   target_sizes     r0   rJ   zNEfficientLoFTRImageProcessor.post_process_keypoint_matching.<locals>.<genexpr>l  s/      II[3{##q(IIIIIIr2   zTEach element of target_sizes must contain the size (h, w) of each image of the batch)devicer   r&   r'   )
keypoints0
keypoints1matching_scores)matchesr,   rC   rQ   r.   r:   rM   torchtensorr   	keypointscloneflipreshapetoint32zipr   logical_andrz   )rd   r   r   r   image_pair_sizesr   resultskeypoints_pairr   scoresvalid_matchesmatched_keypoints0matched_keypoints1r   s                 r0   post_process_keypoint_matchingz;EfficientLoFTRImageProcessor.post_process_keypoint_matchingT  s   , ? #s<'8'888qrrrIILIIIII 	ustttlD)) 	,$|LAWXXX!!$))\-?-Ba-G-G j    ,%++--	 0 5 5b 9 9 A A"aA N NN	LL--	/29gowOf/g/g 	 	+NGV!-fy.@'B,OOM!/!2=3C!D!/!2=3C!D$Qia(89ONN"4"4'6     r2   r@   keypoint_matching_outputzImage.Imagec           	         t                    d D             fdt          dt                    d          D             }g }t          ||          D ]\  }}|d         j        dd         \  }}|d         j        dd         \  }	}
t          j        t          ||	          ||
z   dft
          j                  }|d         |d|d|f<   |d         |d|	|df<   t          j
        |          }t          j        |          }|d	                             d          \  }}|d
                             d          \  }}t          |||||d                   D ]\  }}}}}|                     |          }|                    ||||z   |f|d           |                    |dz
  |dz
  |dz   |dz   fd           |                    ||z   dz
  |dz
  ||z   dz   |dz   fd           |                    |           |S )a  
        Plots the image pairs side by side with the detected keypoints as well as the matching between them.

        Args:
            images (`ImageInput`):
                Image pairs to plot. Same as `EfficientLoFTRImageProcessor.preprocess`. Expects either a list of 2
                images or a list of list of 2 images list with pixel values ranging from 0 to 255.
            keypoint_matching_output (List[Dict[str, torch.Tensor]]]):
                A post processed keypoint matching output

        Returns:
            `List[PIL.Image.Image]`: A list of PIL images, each containing the image pairs side by side with the detected
            keypoints as well as the matching between them.
        c                 ,    g | ]}t          |          S rG   rl   rm   s     r0   rP   zLEfficientLoFTRImageProcessor.visualize_keypoint_matching.<locals>.<listcomp>  rn   r2   c                 *    g | ]}||d z            S rr   rG   )rI   rs   r@   s     r0   rP   zLEfficientLoFTRImageProcessor.visualize_keypoint_matching.<locals>.<listcomp>  s&    KKKQva!a%i(KKKr2   r   r&   Nr   r   )dtyper   r   r   )fillr_   black)r   )rS   r{   rC   r   r,   r-   zerosmaxuint8r   	fromarrayr   Drawunbind
_get_colorlineellipserz   )rd   r@   r   r|   r   rN   pair_outputheight0width0height1width1
plot_imageplot_image_pildrawkeypoints0_xkeypoints0_ykeypoints1_xkeypoints1_ykeypoint0_xkeypoint0_ykeypoint1_xkeypoint1_ymatching_scorecolors    `                      r0   visualize_keypoint_matchingz8EfficientLoFTRImageProcessor.visualize_keypoint_matching  s}   & 188<<V<<<KKKK%3v;;2J2JKKK'*;8P'Q'Q 	+ 	+#J(m1"1"5OGV(m1"1"5OGV3w#8#8&6/1"MUWU]^^^J,6qMJxx&(),6qMJxx()"_Z88N>.11D)4\)B)I)I!)L)L&L,)4\)B)I)I!)L)L&L,VYlL,TeHfW W  R[+{N 77		 +{V/C[Q    
 kAo{QaQ\_`Q`ahoppp 6)A-{Qf@TWX@XZehiZij      
 NN>****r2   c                 ^    t          dd|z
  z            }t          d|z            }d}|||fS )zMaps a score to a color.   r   r   )int)rd   scorergbs        r0   r   z'EfficientLoFTRImageProcessor._get_color  s:    q5y!""e1ayr2   )NN)r~   ) __name__
__module____qualname____doc__model_input_namesr   BILINEARboolr   dictstrr   floatrc   r-   r;   r   r   r   r+   r   r	   r}   rM   tupler   Tensorr   r   r   r   __classcell__)rf   s   @r0   rU   rU      s        , (( )-'9'B '!) )) tCH~&) %	)
 ) ) ) 
) ) ) ) ) )4 ?CDH%
 %
z%
 38n%
 eC)9$9:;	%

 $E#/?*?$@A%
 %
 %
 %
V %))-15%)*.'+;?(8(>DHtC tC D>tC tCH~&	tC
 -.tC TNtC !tC tntC !sJ!78tC &tC $E#/?*?$@AtC 
tC tC tC tCt 	9 9)9 JU349 	9
 
d3$%	&9 9 9 9v44 #'tC,='>"?4 
m		4 4 4 4l      r2   rU   rF   )1r   typingr   r   numpyr-    r   r   image_processing_utilsr   r	   r
   image_transformsr   r   image_utilsr   r   r   r   r   r   r   r   r   r   r   r   utilsr   r   r   r   r=   r   r   modeling_efficientloftrr   
get_loggerr   rw   r;   r   r1   r9   rS   rU   __all__rG   r2   r0   <module>r      s   , + " " " " " " " "     7 7 7 7 7 7 7 7 U U U U U U U U U U C C C C C C C C                            < ; ; ; ; ; ; ; ; ;  LLL @JJJ$$$$$$$$??????		H	%	% AEa a:ac+;&; <=a a a a" AE# ##c+;&; <=# # # # #N$J $ $ $ $8C C C C C#5 C C CL
 *
*r2   