§
    ÇPƒiO  ã            	       óÎ  — U d dl Z d dlmZmZmZmZmZmZ d dlZd dl	m
Z
 d dlmZ  e
¦   «         Zej        ej        ej        ej        dœZeeej        f         ed<   dded	dfd
„Zd	efd„Z	 ddee         deej                 d	ej        fd„Ze j        dej        d	ed         fd„¦   «         Z	 ddeeeej        j        f                  dej        deee                  d	dfd„ZdS )é    N)ÚDictÚ	GeneratorÚIterableÚListÚOptionalÚTuple)Ú
get_logger)Úis_npu_available)Úfp16Úbf16Úfp32Úfp64ÚPRECISION_STR_TO_DTYPEÚhighÚ	precisionÚreturnc                 óä   — t           j                             ¦   «         s	t          sdS t          j        | ¦  «         | dk    rdt           j        j        _        dS dt           j        j        _        dS )a¼  Sets the precision of float32 matrix multiplications and convolution operations.

    For more information, see the PyTorch docs:
    - https://pytorch.org/docs/stable/generated/torch.set_float32_matmul_precision.html
    - https://pytorch.org/docs/stable/backends.html#torch.backends.cudnn.allow_tf32

    Args:
        precision (str): The setting to determine which datatypes to use for matrix multiplication and convolution operations.
    NÚhighestFT)ÚtorchÚcudaÚis_availabler
   Úset_float32_matmul_precisionÚbackendsÚcudnnÚ
allow_tf32)r   s    úp/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/torchtune/training/precision.pyÚ_set_float32_precisionr      si   € õ ŒJ×#Ò#Ñ%Ô%ð Õ)9ð Øˆå	Ô& yÑ1Ô1Ð1àIÒÐØ*/ŒÔÔ'Ð'Ð'à*.ŒÔÔ'Ð'Ð'ó    c                  ób  — t           j                             ¦   «         obt           j                             ¦   «         oDt           j                             ¦   «         o&t           j        j                             ¦   «         dk    } t           j        j	                             ¦   «         o"t           j        j	         
                    ¦   «         }t          ot           j                             ¦   «         }t           j                             ¦   «         ot           j                             ¦   «         }| p|p|p|S )aË  
    Check that bf16 is available on this hardware. Requirements:
        - CUDA is available and supports bf16
            - CUDA version >= 11
            - CUDA compute capability >= 8
        - NCCL is available and version >= 2.10
        - MPS is available and torch was built with MPS
        - NPU is available and supports bf16
        - XPU is available and supports bf16

    Returns:
        bool: True if bf16 is available, False otherwise.

    )é   é
   )r   r   r   Úis_bf16_supportedÚdistributedÚis_nccl_availableÚncclÚversionr   ÚmpsÚis_builtr
   ÚnpuÚxpu)Úcuda_supportÚmps_supportÚnpu_supportÚxpu_supports       r   Úverify_bf16_supportr/   0   sç   € õ  	Œ
×ÒÑ!Ô!ð 	1ÝŒJ×(Ò(Ñ*Ô*ð	1åÔ×/Ò/Ñ1Ô1ð	1õ ŒJŒO×#Ò#Ñ%Ô%¨Ò0ð	 õ ”.Ô$×1Ò1Ñ3Ô3ÐU½¼Ô8J×8SÒ8SÑ8UÔ8U€KÝ"ÐD¥u¤y×'BÒ'BÑ'DÔ'D€KÝ”)×(Ò(Ñ*Ô*ÐL­u¬y×/JÒ/JÑ/LÔ/L€KØÐD˜;ÐD¨+ÐD¸ÐDr   ÚdtypeÚdevicec                 ó²  — | €t           j        S t                               | | ¦  «        }|t                               ¦   «         vrMt          d|› dd                     t          t                               ¦   «         ¦  «        ¦  «        › d¦  «        ‚|t           j	        k    r5|t          j
        d¦  «        k    rt          ¦   «         st          d¦  «        ‚|S )aÕ  Get the torch.dtype corresponding to the given precision string. If no string is passed,
    we will default to torch.float32.

    Note:
        If bf16 precision is requested with a CUDA device, we verify whether the device indeed supports
        bf16 kernels. If not, a ``RuntimeError`` is raised.

    Args:
        dtype (Optional[str]): The precision dtype. Default: ``None``, in which we default to torch.float32
        device (Optional[torch.device]): Device in use for training. Only CUDA and CPU
            devices are supported. If a CUDA device is passed in, additional checking is done
            to ensure that the device supports the requested precision. Default: ``None``, in which case
            a CUDA device is assumed.
    Raises:
        ValueError: if precision isn't supported by the library
        RuntimeError: if bf16 precision is requested but not available on this hardware.

    Returns:
        torch.dtype: The corresponding torch.dtype.

    NzDtype z must be one of z, z for finetuning.Úcpuzcbf16 precision was requested but not available on this hardware. Please use fp32 precision instead.)r   Úfloat32r   ÚgetÚvaluesÚ
ValueErrorÚjoinÚlistÚkeysÚbfloat16r1   r/   ÚRuntimeError)r0   r1   Útorch_dtypes      r   Ú	get_dtyper>   K   sÜ   € ð4 €}ÝŒ}Ðõ )×,Ò,¨U°EÑ:Ô:€Kð Õ0×7Ò7Ñ9Ô9Ð9Ð9ÝØr[ÐrÐr°$·)²)½DÕAW×A\ÒA\ÑA^ÔA^Ñ<_Ô<_Ñ2`Ô2`ÐrÐrÐrñ
ô 
ð 	
ð
 	•u”~Ò%Ð%Ø•e”l 5Ñ)Ô)Ò)Ð)Ý#Ñ%Ô%ð *õ Øqñ
ô 
ð 	
ð Ðr   )NNNc              #   ó¼   K  — t          j        ¦   «         }t          j        | ¦  «         	 dV — t          j        |¦  «         dS # t          j        |¦  «         w xY w)a…  
    Context manager to set torch's default dtype.

    Args:
        dtype (torch.dtype): The desired default dtype inside the context manager.

    Returns:
        ContextManager: context manager for setting default dtype.

    Example:
        >>> with set_default_dtype(torch.bfloat16):
        >>>     x = torch.tensor([1, 2, 3])
        >>>     x.dtype
        torch.bfloat16


    N)r   Úget_default_dtypeÚset_default_dtype)r0   Ú	old_dtypes     r   rA   rA   }   sc   è è € õ& Ô'Ñ)Ô)€IÝ	Ô˜EÑ"Ô"Ð"ð+ØˆˆˆåÔ 	Ñ*Ô*Ð*Ð*Ð*øÔ 	Ñ*Ô*Ð*Ð*øøøs   «A ÁAÚnamed_paramsÚexclude_param_namesc           	      ó¤   ‡— | D ]K\  Š}|t          ˆfd„|D ¦   «         ¦  «        rŒ#|j        |k    rt          d‰› d|j        › d|› ¦  «        ‚ŒLdS )a¦  
    Validates that all input parameters have the expected dtype.

    Args:
        named_params (Iterable[Tuple[str, torch.nn.Parameter]]): Iterable of named parameters.
        dtype (torch.dtype): Expected dtype.
        exclude_param_names (Optional[List[str]]): Optional list of parameter names to exclude from dtype checking

    Raises:
        ValueError: If any parameter has a different dtype than `dtype`.
    Nc              3   ó    •K  — | ]}|‰v V — Œ	d S ©N© )Ú.0ÚnÚnames     €r   ú	<genexpr>z0validate_expected_param_dtype.<locals>.<genexpr>ª   s'   øè è € Ð:Ð: 1˜9Ð:Ð:Ð:Ð:Ð:Ð:r   z
Parameter z has dtype z, but expected )Úanyr0   r7   )rC   r0   rD   ÚparamrK   s       @r   Úvalidate_expected_param_dtyperO   ˜   s’   ø€ ð  $ð ð ‰ˆˆeØÐ*ÝÐ:Ð:Ð:Ð:Ð&9Ð:Ñ:Ô:Ñ:Ô:ð ØØŒ;˜%ÒÐÝØQ˜TÐQÐQ¨e¬kÐQÐQÈ%ÐQÐQñô ð ð  ð	ð r   )r   )NNrG   ) Ú
contextlibÚtypingr   r   r   r   r   r   r   Útorchtune.utilsr	   Útorchtune.utils._devicer
   ÚlogÚfloat16r;   r4   Úfloat64r   Ústrr0   Ú__annotations__r   Úboolr/   r1   r>   ÚcontextmanagerrA   ÚnnÚ	ParameterrO   rH   r   r   ú<module>r]      sð  ðð Ð Ð Ð Ð Ø CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ CÐ Cà €€€à &Ð &Ð &Ð &Ð &Ð &Ø 4Ð 4Ð 4Ð 4Ð 4Ð 4à€jl„l€ð ŒMØŒNØŒMØŒMð	2ð 2Ð ˜˜S %¤+Ð-Ô.ð ð ñ ð/ð / cð /°tð /ð /ð /ð /ð,E˜Tð Eð Eð Eð Eð8 CGð/ð /ØCŒ=ð/Ø)1°%´,Ô)?ð/à
„[ð/ð /ð /ð /ðd Ôð+˜Uœ[ð +¨YÐ7GÔ-Hð +ð +ð +ñ Ôð+ð: 04ðð Ø˜5  e¤hÔ&8Ð!8Ô9Ô:ðàŒ;ðð " $ s¤)Ô,ðð 
ð	ð ð ð ð ð r   