§
    *`ƒi  م            
       َ<  — d dl mZmZ d dlZd dlmZmZ d dlmZm	Z	m
Z
 d dlmZ d dlmZ dgZ	 ddee         d	ee         d
ee         defd„Z	 	 ddej        j        d
ee         dee         fd„Z	 	 ddej        j        d
ee         dee         dee         fd„ZdS )é    )عListعOptionalN)عCompressionFormatعSparsityStructure)عQuantizationArgsعQuantizationStrategyعQuantizationType)عis_module_quantized)عloggerع,infer_and_set_per_module_quantization_formatع
input_argsعweight_argsعsparsity_structureعreturnc                 َژ  — t          |¦  «        t           j        k    }|duo| du }|j        dk    r=|j        t          j        j        k    r#|j        dk    rt          j	        S t          j
        S |rt|j        dv o|j        t          j        j        k    }|st          j        S |r5|j        t          j        j        t          j        j        fv rt          j        S t          j        S |j        t          j        j        k    r|j        dk    rt          j        S |j        t          j        j        k    rt          j        S t          j        S )a   
    Using the weight and input quantization args as well as an optional
    sparsity structure, determine the compression format that should be
    applied to a given module

    :param input_args: input quantization parameters
    :param weight_args: weight quantization parameters
    :param sparsity_structure: optional (global) modle sparsity
        structure
    :return CompresssionFormat for the module
    Né   é    )r   é   r   )r   عTWO_FOURعnum_bitsعtyper	   عFLOATعvalueع
group_sizer   عmxfp4_pack_quantizedعnvfp4_pack_quantizedعINTعnaive_quantizedعstrategyr   عCHANNELعGROUPع	marlin_24عpack_quantizedعfloat_quantizedعint_quantized)r   r   r   عis_24_structureعis_weight_onlyعis_valid_packs         ْt/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/compressed_tensors/config/format.pyع_get_quant_compression_formatr*      sO  € ُ" 	ذ,ر-ش-ص1Bش1KزKً ً !¨ذ,ذC°¸tذ1C€Nàشکqز ذ  [ش%5ص9Iش9Oش9Uز%Uذ%Uطش! Rز'ذ'ف$ش9ذ9ف ش5ذ5àً 1àش  Fذ*ً ?طش ص$4ش$8ش$>ز>ً 	ً ً 	5ف$ش4ذ4àً 	/ک{ش3ف ش(ش.ف ش&ش,ً8
ً  
ً  
ُ %ش.ذ.ف ش/ذ/ً شص 0ش 6ش <ز<ذ<طش$¨ز)ذ)ه$ش4ذ4طشص/ش3ش9ز9ذ9ف$ش2ذ2ه ش0ذ0َ    عmoduleعquantization_formatc                 َR  — | j         j        }| j         j        }|€dS t          |||¦  «        }|پ-||j        k    rt          j        d¦  «         || j         _        dS | j         j        پ-| j         j        |j        k    rt          j        d¦  «         dS dS |j        | j         _        dS )a[  
    Determine and set the per module quantization format given quantization args
    and sparsity structure.

    :param module: module which has its quantization inferred
    :param sparsity_structure: optional sparsity applied to the module
    :param quantization_format: optional global format to override
        the per module formats

    Nz\The provided format for the module does not match the inferred format. Compression may fail )عquantization_schemeعweightsعinput_activationsr*   r   r   عwarningعformat)r,   r   r-   عweight_schemeعinput_schemeعcompression_formats         r)   عset_per_module_formatr7   V   sن   € ً ش.ش6€Mطش-ش?€Lطذطˆف6طگmذ%7ٌô ذً ذ&طذ"4ش":ز:ذ:فŒNً9ٌô ً ً -@ˆش"ش)ذ)ذ)à	ش	#ش	*ذ	6àش%ش,ذ0Bش0HزHذHفŒNً9ٌô ً ً ً ً IذHً -?ش,Dˆش"ش)ذ)ذ)r+   عmodelc                 َX  — g }|                       ¦   «         D ]m}t          |¦  «        r\t          |d¦  «        sJ ‚t          |||¦  «         |j        j        r-|j        j        |vr|                     |j        j        ¦  «         Œnt          |¦  «        dk    r|S t          j	        j
        gS )a“  
    Infers the quantization format for a model based on its state and provided
    compression arguments. Updates thhe quantization_scheme.format value
    based on the inferred format. Returns the unique list of formats in the model.
    All None formats are mapped to CompressionFormat.dense.value

    For a summary of the formats, see `docs/guides/compression_formats.md`.

    :param model: model to check for quantization
    :param sparsity_structure: optional sparsity applied to the module
    :param quantization_format: optional global format to override
        the per module formats
    :return compression format appropriate for the model
    r/   r   )عmodulesr
   عhasattrr7   r/   r3   عappendعlenr   عdenser   )r8   r   r-   عunique_formatsع	submodules        r)   r   r   ƒ   sء   € ً& €Nط—]’]‘_”_ً Lً Lˆ	فکyر)ش)ً 	Lفک9ذ&;ر<ش<ذ<ذ<ذ<ف! )ذ-?ذATرUشUذUàش-ش4ًLàش1ش8ہذNذNà×%ز% iش&Cش&JرKشKذKّه
ˆ>رشکQزذطذفش#ش)ذ*ذ*r+   )N)NN)عtypingr   r   عtorchعcompressed_tensors.configr   r   عcompressed_tensors.quantizationr   r   r	   ع%compressed_tensors.quantization.utilsr
   عlogurur   ع__all__عstrr*   عnnعModuler7   r   © r+   r)   ْ<module>rL      s¥  ًً "ذ !ذ !ذ !ذ !ذ !ذ !ذ !à €€€ط Jذ Jذ Jذ Jذ Jذ Jذ Jذ Jًً ً ً ً ً ً ً ً ً ً
 Fذ Eذ Eذ Eذ Eذ Eط ذ ذ ذ ذ ذ ً :ذ
:€ً )-ً41ً 41طذ)ش*ً41àذ*ش+ً41ً ! œً41ً ً	41ً 41ً 41ً 41ًr )-ط)-ً*Eً *EطŒHŒOً*Eà  œً*Eً " #œً*Eً *Eً *Eً *Eً^ )-ط)-ً +ً  +طŒ8Œ?ً +à  œً +ً " #œً +ً 
ˆ#„Yً	 +ً  +ً  +ً  +ً  +ً  +r+   