Ë
    ’'}h<o  ã                   óÖ  — d dl Z d dlZd dlZd dlZd dlmZ d dlmc mc mZ	 d dl
mZ d dlmZmZmZmZmZmZmZmZ ddlmZmZ d dlmZmZ d dlmZmZmZmZm Z m!Z! d dl"m#Z# d d	l$m%Z% d d	l$m%Z& g d
¢Z'ejP                  ejR                  jP                  ejT                  ejR                  jT                  iejR                  jP                  ej                  jP                  ejR                  jT                  ej                  jT                  idœZ+d„ Z,	 d!d„Z-d"d„Z.d„ Z/d„ Z0d#d„Z1d$d„Z2d„ Z3d„ Z4	 	 	 d%d„Z5d„ Z6d„ Z7d&d„Z8dejr                  ddfd„Z:d&d„Z;d#d„Z<	 	 d'd„Z=	 	 d(d„Z>d„ Z?d)d „Z@y)*é    N)Ú_FusedModule)Ú)get_default_dynamic_quant_module_mappingsÚ(get_default_static_quant_module_mappingsÚ2get_default_static_quant_reference_module_mappingsÚget_default_qat_module_mappingsÚ$get_default_qconfig_propagation_listÚno_observer_setÚ_has_special_act_post_processÚ_get_special_act_post_processé   )Úget_qparam_dictÚ)has_no_children_ignoring_parametrizations)ÚDeQuantStubÚQuantWrapper)Ú_add_module_to_qconfig_obs_ctrÚdefault_dynamic_qconfigÚfloat16_dynamic_qconfigÚ!float_qparams_weight_only_qconfigÚ&float_qparams_weight_only_qconfig_4bitÚ_activation_is_memoryless)Útype_before_parametrizations)Ú_is_activation_post_process)
Úget_default_custom_config_dictÚpropagate_qconfig_Úadd_quant_dequantÚprepareÚquantizeÚquantize_dynamicÚprepare_qatÚquantize_qatÚconvertÚswap_module)Ú%float_to_observed_custom_module_classÚ)observed_to_quantized_custom_module_classc                  ó   — t         S )z,Defines the default custom config dict.
    )Ú_DEFAULT_CUSTOM_CONFIG_DICT© ó    ú]/var/www/html/test/engine/venv/lib/python3.12/site-packages/torch/ao/quantization/quantize.pyr   r   =   s
   € ô 'Ð&r(   c                 óÔ  — |j                  t        | «      |«      }|j                  ||«      }t        | d|«      }t        j                  j
                  j                  j                  || «       t        || «      }|| _        | j                  «       D ]T  \  }}|r|dz   |z   n|}	|3||j                  dg «      v rŒ)t        |«      |j                  dg «      v rŒGt        ||||	«       ŒV y)aò  This is a helper function for `propagate_qconfig_`

    Args:
        module: input module
        qconfig_dict: dictionary that maps from name of submodule to quantization
                     configuration
        qconfig_parent: quantization config of parent module, we will fallback to
                       this config when there is no specified config for current
                       module
        prefix: corresponding prefix of the current module, used as key in
                qconfig_dict
        prepare_custom_config_dict: dictionary for custom handling of modules
                                    see docs for :func:`~torch.ao.quantization.prepare_fx`

    Return:
        None, module is modified inplace with qconfig attached
    Úqconfigú.NÚnon_traceable_module_nameÚnon_traceable_module_class)Úgetr   ÚgetattrÚtorchÚaoÚquantizationr+   Ú_assert_valid_qconfigr   Únamed_childrenÚtypeÚ_propagate_qconfig_helper)
ÚmoduleÚqconfig_dictÚqconfig_parentÚprefixÚprepare_custom_config_dictÚmodule_qconfigÚqconfig_with_device_checkÚnameÚchildÚmodule_prefixs
             r)   r7   r7   B   sê   € ð( "×%Ñ%Ô&BÀ6Ó&JÈNÓ[€NØ!×%Ñ% f¨nÓ=€NÜ˜V Y°Ó?€Nä	‡HH×Ñ×!Ñ!×7Ñ7¸ÈÔOä >¸~ÈvÓ VÐØ.€F„Nà×,Ñ,Ó.ò 	‰ˆˆeÙ/5˜ ™ tÒ+¸4ˆà%Ð-ØÐ.×2Ñ2Ð3NÐPRÓSÒSÜE‹{Ð8×<Ñ<Ð=YÐ[]Ó^Ò^ä%Ø|Ð%>Àõñ	r(   c                 ó0   — |€i }|€i }t        | ||¬«       y)a“  Propagate qconfig through the module hierarchy and assign `qconfig`
    attribute on each leaf module

    Args:
        module: input module
        qconfig_dict: dictionary that maps from name or type of submodule to
            quantization configuration, qconfig applies to all submodules of a
            given module unless qconfig for the submodules are specified (when
            the submodule already has qconfig attribute)
        prepare_custom_config_dict: dictionary for custom handling of modules
            see docs for :func:`~torch.ao.quantization.prepare_fx`

    Return:
        None, module is modified inplace with qconfig attached
    N)r<   )r7   )r8   r9   r<   s      r)   r   r   j   s(   € ð  ÐØˆØ!Ð)Ø%'Ð"Ü˜f lÐOiÖjr(   c                 ó$   — | j                  |«      S )z3Forward hook that calls observer on the output
    ©Úactivation_post_process)ÚselfÚinputÚoutputs      r)   Ú_observer_forward_hookrI   €   s   € ð ×'Ñ'¨Ó/Ð/r(   c                 ó*   — | j                  |d   «      S )z7Forward pre hook that calls observer on the output
    r   rD   )rF   rG   s     r)   Ú_observer_forward_pre_hookrK   …   s   € ð ×'Ñ'¨¨a©Ó1Ð1r(   Fc                 óŒ   — t        | d«      sJ d«       ‚|r| j                  t        d¬«      }y | j                  t        d¬«      }y )NrE   zGExpect activation_post_process attribute already attached to the moduleT)Úprepend)ÚhasattrÚregister_forward_pre_hookrK   Úregister_forward_hookrI   )r8   Úpre_hookÚhandles      r)   Ú&_register_activation_post_process_hookrS   Š   sX   € Ü6Ð4Ô5ð RØQóRÐ5áØ×1Ñ1Ü&°ð 2ó 
‰ð ×-Ñ-Ü"¨Dð .ó 
‰r(   c                 ój  ‡‡‡— |€
t        «       }|€i }‰€Gt        | «      }t        |«      dk  s
J d|› «       ‚t        |«      dkD  rt        t	        |«      «      ndŠdd„Šd„ Šdˆˆˆfd„	}| j                  «       D ]m  \  }}t        |«      t        j                  fv rŒ$t        t        |«      t        j                  t        j                  f«      rB ‰|«      sŒ`t        |d«      sJ d	t        |«      › d
«       ‚ ‰|j                  ‰«      |_        Œ™t!        |t"        «      r ‰|«      sŒ² ||«       Œ»|t        |«      |v r ‰|«      sŒÓ ||«       ŒÜt%        |«      rt'        |«      }	 |||	«       Œü ‰|«      r[t        |«      |v rN|t        |«         j)                  |«      }
t+        | ||
«       |t        |«         t-        «       vsŒU ||
«       Œ_t/        |||‰|«       Œp t1        | «      r<t!        | t2        j                  j4                  «      st        | «      |v r	 || «       yyyy)as  Add observer for the leaf child of the module.

    This function insert observer module to all leaf child module that
    has a valid qconfig attribute.

    Args:
        module: input module with qconfig attributes for all the leaf modules that we want to quantize
        qconfig_propagation_list: a list of quantizable modules that will have observers added to them
            if they are leaf nodes
        device: parent device, if any
        non_leaf_module_list: list of non-leaf modules we want to add observer

    Return:
        None, module is modified inplace with added observer modules and forward_hooks
    Nr   zR_add_observer_ only works with cpu or single-device CUDA modules, but got devices r   c                 ó^   — |€| j                  «       n |«       }||j                  |«       |S ©N)Ú
activationÚto)r+   ÚdeviceÚspecial_act_post_processrW   s       r)   Úget_activation_post_processz3_add_observer_.<locals>.get_activation_post_processµ   s3   € Ø-EÐ-MW×'Ñ'Ô)ÑSkÓSmˆ
ØÐØM‰M˜&Ô!ØÐr(   c                 ó:   — t        | d«      xr | j                  d uS )Nr+   ©rN   r+   )Úms    r)   Úneeds_observationz)_add_observer_.<locals>.needs_observation»   s   € Üq˜)Ó$Ò>¨¯©¸$Ð)>Ð>r(   c                 óÂ   •—  ‰| «      rVt        | t        «      sE| j                  d ‰| j                  ‰|«      «       t	        | t        | j                  «      ¬«       yyy)zn Adds an activation post process module and register
        a pre or post hook that calls the module
        rE   ©rQ   N)Ú
isinstancer   Ú
add_moduler+   rS   r   )r^   rZ   rY   r[   r_   s     €€€r)   Úinsert_activation_post_processz6_add_observer_.<locals>.insert_activation_post_process¾   s[   ø€ ñ
 ˜QÔ¬
°1´kÔ(BàL‰LÐ2Ñ4OØ—	‘	˜6Ð#;ó5=ô >ô 3°1Ô?XÐYZ×YbÑYbÓ?cÖdð )CÐr(   rE   zfunctional class z- has no pre-defined `activation_post_process`rV   )r   Ú_get_unique_devices_ÚlenÚnextÚiterr5   r   ÚnnÚDropoutÚ
issubclassÚnnqÚFloatFunctionalÚQFunctionalrN   r+   rE   rb   r   r
   r   Ú
from_floatÚsetattrr	   Ú_add_observer_r   r1   Ú
Sequential)r8   Úqconfig_propagation_listÚnon_leaf_module_listrY   Úcustom_module_class_mappingÚdevicesrd   r?   r@   rZ   Úobserved_childr[   r_   s      `       @@r)   rq   rq   —   s=  ú€ ð   Ð'Ü#GÓ#IÐ à"Ð*Ø&(Ð#ð €~Ü& vÓ.ˆÜ7‹|˜qÒ ð 	
Ø`ÐahÐ`iÐjó	
Ð ô ),¨G«°qÒ(8””d˜7“mÔ$¸dˆóò?÷eð ×,Ñ,Ó.ó w‰ˆˆeä'¨Ó.´2·:±:°,Ñ>ØÜÔ4°UÓ;¼c×>QÑ>QÔSV×SbÑSbÐ=cÔdÙ  Õ'Ü˜uÐ&?Ô@ð Ø'Ô(DÀUÓ(KÐ'LÐLyÐzóÐ@ñ 1LÈEÏMÉMÐ[aÓ0bÕ-Ü˜œ|Ô,á  Õ'Ù.¨uÕ5Ø!Ð-Ô2NÈuÓ2UÐYmÑ2mÙ  Õ'Ù.¨uÕ5Ü*¨5Ô1Ü'DÀUÓ'KÐ$Ù*¨5Ð2JÕKÙ˜uÔ%Ô*FÀuÓ*MÐQlÑ*lØ8Ô9UÐV[Ó9\Ñ]×hÑhÐinÓoˆNÜF˜D .Ô1ð +Ô+GÈÓ+NÑOÔWfÓWhÓhÙ.¨~Ö>ä˜5Ð":Ð<PÐRXÐZuÖvð9wô@ 1°Ô8ÄÈFÔTY×T\ÑT\×TgÑTgÔAhÜ'¨Ó/Ð3KÑKÙ& vÕ.ð Lð BiÐ8r(   c                 ó¸   — | j                  «       D ch c]  }|j                  ’Œ c}| j                  «       D ch c]  }|j                  ’Œ c}z  S c c}w c c}w rV   )Ú
parametersrY   Úbuffers)r8   Úps     r)   re   re   ï   sF   € Ø$×/Ñ/Ó1Ö2˜ˆAH‹HÒ2Ø!Ÿ>™>Ó+Ö,aˆ‹Ò,ñ-ð -ùÒ2ùÚ,s
   “AºAc                 óÂ   — t        | «      r#t        | d«      r| j                  rt        | «      S | j	                  «       D ]  \  }}t        |«      | j                  |<   Œ | S )a{  Wrap the leaf child module in QuantWrapper if it has a valid qconfig
    Note that this function will modify the children of module inplace and it
    can return a new module which wraps the input module as well.

    Args:
        module: input module with qconfig attributes for all the leaf modules
        that we want to quantize

    Return:
        Either the inplace modified module with submodules wrapped in
        `QuantWrapper` based on qconfig or a new `QuantWrapper` module which
        wraps the input module, the latter case only happens when the input
        module is a leaf module and we want to quantize it.
    r+   )r   rN   r+   r   r5   r   Ú_modules)r8   r?   r@   s      r)   r   r   ó   s]   € ô 1°Ô8¼WÀVÈYÔ=WÐ\b×\jÒ\jÜ˜FÓ#Ð#à×,Ñ,Ó.ò 9‰ˆˆeÜ 1°%Ó 8ˆ‰˜Òð9à€Mr(   c                 ól  — t         j                  j                  d«       |€
t        «       }|j	                  di «      }|st        j                  | «      } |}|€
t        «       }t        | d¬«       t        d„ | j                  «       D «       «      st        j                  d«       t        | |||¬«       | S )aƒ  Prepares a copy of the model for quantization calibration or quantization-aware training.

    Quantization configuration should be assigned preemptively
    to individual submodules in `.qconfig` attribute.

    The model will be attached with observer or fake quant modules, and qconfig
    will be propagated.

    Args:
        `model`: input model to be modified in-place
        `inplace`: carry out model transformations in-place, the original module is mutated
        `allow_list`: list of quantizable modules
        `observer_non_leaf_module_list`: list of non-leaf modules we want to add observer
        `prepare_custom_config_dict`: customization configuration dictionary for prepare function

    .. code-block:: python

       # Example of prepare_custom_config_dict:
       prepare_custom_config_dict = {
           # user will manually define the corresponding observed
           # module class which has a from_float class method that converts
           # float custom module to observed custom module
           "float_to_observed_custom_module_class": {
               CustomModule: ObservedCustomModule
           }
        }

    z!quantization_api.quantize.prepareNr#   ©r9   c              3   óP   K  — | ]  }t        |d «      xr |j                  –— Œ  y­w)r+   Nr]   )Ú.0r^   s     r)   ú	<genexpr>zprepare.<locals>.<genexpr>7  s#   è ø€ ÒL°qŒwq˜)Ó$Ò2¨¯©Ó2ÑLùs   ‚$&z¬None of the submodule got qconfig applied. Make sure you passed correct configuration through `qconfig_dict` or by assigning the `.qconfig` attribute directly on submodules)ru   )r1   Ú_CÚ_log_api_usage_oncer   r/   ÚcopyÚdeepcopyr   r   ÚanyÚmodulesÚwarningsÚwarnrq   )ÚmodelÚinplaceÚ
allow_listÚobserver_non_leaf_module_listr<   ru   rs   s          r)   r   r   	  s´   € ô> 
‡HH× Ñ Ð!DÔEØ!Ð)Ü%CÓ%EÐ"Ø"<×"@Ñ"@ÐAhÐjlÓ"mÐáÜ—‘˜eÓ$ˆð  *ÐØÐÜ#GÓ#IÐ Üu¨4Õ0ô ÑL¸E¿M¹M»OÔLÔLÜ‰ð Uô 	Vô ØÐ'Ð)FØ$?õAð €Lr(   c                 ó   ‡ — t        ‰ d«      r!t        ‰ j                  «      rt        ‰ d«       dˆ fd„	} |d¬«        |d¬«       y )NrE   Fc                 óö   •— | r‰j                   n‰j                  }| rt        nt        }t	        «       }|j                  «       D ]  \  }}||u sŒ|j                  |«       Œ |D ]  }|j                  |«       Œ y rV   )Ú_forward_pre_hooksÚ_forward_hooksrK   rI   ÚsetÚitemsÚaddÚpop)rQ   Úhook_mapÚobserver_hookÚhandle_ids_to_removeÚ	handle_idÚhook_fnr8   s         €r)   Úremove_hooksz5_remove_activation_post_process.<locals>.remove_hooksI  sy   ø€ Ù086×,Ò,¸f×>SÑ>SˆÙ6>Õ2ÔDZˆÜ"›uÐØ"*§.¡.Ó"2ò 	4ÑˆIwØ˜-Ò'Ø$×(Ñ(¨Õ3ð	4ð .ò 	$ˆIØL‰L˜Õ#ñ	$r(   Tra   ©F)rN   r   rE   Údelattr)r8   rœ   s   ` r)   Ú_remove_activation_post_processrŸ   A  s@   ø€ ô ˆvÐ0Ô1Ü" 6×#AÑ#AÔBÜÐ1Ô2õ$ñ ˜$ÕÙ˜%Ö r(   c                 óv   — | j                  «       D ]  }t        |«       Œ t        | d«      r| `t	        | «       y)zŠClean up the qconfig left in the module so that new qconfig can be
    propagated.

    Args:
        module: module to be cleaned up
    r+   N)ÚchildrenÚ_remove_qconfigrN   r+   rŸ   )r8   r@   s     r)   r¢   r¢   W  s;   € ð —‘Ó"ò ˆÜ˜Õðô ˆvyÔ!ØˆNä# FÕ+r(   c                 óò   — t         j                  j                  d«       |€
t        «       }|st	        j
                  | «      } | j                  «        t        | d¬«        || g|¢­Ž  t        | |d¬«       | S )aƒ  Quantize the input float model with post training static quantization.

    First it will prepare the model for calibration, then it calls
    `run_fn` which will run the calibration step, after that we will
    convert the model to a quantized model.

    Args:
        model: input float model
        run_fn: a calibration function for calibrating the prepared model
        run_args: positional arguments for `run_fn`
        inplace: carry out model transformations in-place, the original module is mutated
        mapping: correspondence between original module types and quantized counterparts

    Return:
        Quantized model.
    z"quantization_api.quantize.quantizeT©rŒ   )	r1   rƒ   r„   r   r…   r†   Úevalr   r!   )r‹   Úrun_fnÚrun_argsÚmappingrŒ   s        r)   r   r   f  sf   € ô" 
‡HH× Ñ Ð!EÔFØ€Ü:Ó<ˆÙÜ—‘˜eÓ$ˆØ	‡JJ„LÜˆE˜4Õ Ù
ˆ5Ð8ÓÜˆE7 DÕ)Ø€Lr(   c                 óp  — t         j                  j                  d«       |€•|t         j                  k(  r|t        j
                  t        t        j                  t        t        j                  t        t        j                  t        t        j                  t        t        j                  t        i}n·|t         j                  k(  r|t        j
                  t        t        j                  t        t        j                  t        t        j                  t        t        j                  t        t        j                  t        i}n(|t         j                  k(  r+t        j                  t         t        j"                  t         i}nê|t         j$                  k(  rt        j                  t&        i}nÀt)        d|› d«      ‚t+        |t,        «      r¡|t         j                  u rt        }n`|t         j                  u rt        }nG|t         j                  u rt         }n.|t         j$                  u rt&        }nt/        dt1        |«      «      ‚t3        t5        |t7        j8                  |«      «      «      }|€
t;        «       }|st=        j>                  | «      } | jA                  «        tC        | |«       tE        | |d¬«       | S )av  Converts a float model to dynamic (i.e. weights-only) quantized model.

    Replaces specified modules with dynamic weight-only quantized versions and output the quantized model.

    For simplest usage provide `dtype` argument that can be float16 or qint8. Weight-only quantization
    by default is performed for layers with large weights size - i.e. Linear and RNN variants.

    Fine grained control is possible with `qconfig` and `mapping` that act similarly to `quantize()`.
    If `qconfig` is provided, the `dtype` argument is ignored.

    Args:
        model: input model
        qconfig_spec: Either:

            - A dictionary that maps from name or type of submodule to quantization
              configuration, qconfig applies to all submodules of a given
              module unless qconfig for the submodules are specified (when the
              submodule already has qconfig attribute). Entries in the dictionary
              need to be QConfig instances.

            - A set of types and/or submodule names to apply dynamic quantization to,
              in which case the `dtype` argument is used to specify the bit-width

        inplace: carry out model transformations in-place, the original module is mutated
        mapping: maps type of a submodule to a type of corresponding dynamically quantized version
            with which the submodule needs to be replaced

    z*quantization_api.quantize.quantize_dynamicz5Don't know how to quantize with default settings for z. Provide full qconfig pleasez.Unknown dtype specified for quantize_dynamic: Tr¤   )#r1   rƒ   r„   Úqint8ri   ÚLinearr   ÚLSTMÚGRUÚLSTMCellÚRNNCellÚGRUCellÚfloat16r   Úquint8ÚEmbeddingBagr   Ú	EmbeddingÚquint4x2r   Ú
ValueErrorrb   r“   ÚRuntimeErrorÚstrÚdictÚzipÚ	itertoolsÚrepeatr   r…   r†   r¥   r   r!   )r‹   Úqconfig_specÚdtyper¨   rŒ   Údefault_qconfigs         r)   r   r   ‚  sä  € ô< 
‡HH× Ñ Ð!MÔNØÑØ”E—K‘KÒä—	‘	Ô3Ü—‘Ô1Ü—‘Ô0Ü—‘Ô5Ü—
‘
Ô4Ü—
‘
Ô4ðŠLð ”e—m‘mÒ#ä—	‘	Ô3Ü—‘Ô1Ü—‘Ô0Ü—‘Ô5Ü—
‘
Ô4Ü—
‘
Ô4ðŠLð ”e—l‘lÒ"ä—‘Ô"CÜ—‘Ô@ð‰Lð ”e—n‘nÒ$ä—‘Ô"Hð‰Lô ØGÈÀwÐNkÐlónð nä	L¤#Ô	&Ø”E—K‘KÑÜ5‰OØ”e—m‘mÑ#Ü5‰OØ”e—l‘lÑ"Ü?‰OØ”e—n‘nÑ$ÜD‰OäÐOÔQTÐUZÓQ[Ó\Ð\ÜœC ¬i×.>Ñ.>¸Ó.OÓPÓQˆà€Ü;Ó=ˆáÜ—‘˜eÓ$ˆØ	‡JJ„LÜu˜lÔ+ÜˆE7 DÕ)Ø€Lr(   c                 ó2  — t         j                  j                  d«       | j                  sJ d«       ‚|€
t	        «       }|st        j                  | «      } t        | d¬«       t        | |dd¬«       t        | t        |j                  «       «      d¬«       | S )	a  
    Prepares a copy of the model for quantization calibration or
    quantization-aware training and converts it to quantized version.

    Quantization configuration should be assigned preemptively
    to individual submodules in `.qconfig` attribute.

    Args:
        model: input model to be modified in-place
        mapping: dictionary that maps float modules to quantized modules to be
                 replaced.
        inplace: carry out model transformations in-place, the original module
                 is mutated
    z%quantization_api.quantize.prepare_qatz1prepare_qat only works on models in training modeNr   TF)r¨   rŒ   Úremove_qconfig)rŽ   rŒ   )r1   rƒ   r„   Útrainingr   r…   r†   r   r!   r   r“   Úvalues)r‹   r¨   rŒ   s      r)   r   r   ×  s}   € ô 
‡HH× Ñ Ð!HÔIØ>Š>ÐNÐNÓNˆ>Ø€Ü1Ó3ˆáÜ—‘˜eÓ$ˆäu¨4Õ0ÜˆE˜7¨DÀÕGÜˆE´°W·^±^Ó5EÓ1FÐPTÕUØ€Lr(   c                 óØ   — t         j                  j                  d«       |st        j                  | «      } | j                  «        t        | d¬«        || g|¢­Ž  t        | d¬«       | S )ag  Do quantization aware training and output a quantized model

    Args:
        model: input model
        run_fn: a function for evaluating the prepared model, can be a
                function that simply runs the prepared model or a training
                loop
        run_args: positional arguments for `run_fn`

    Return:
        Quantized model.
    z&quantization_api.quantize.quantize_qatTr¤   )r1   rƒ   r„   r…   r†   Útrainr   r!   )r‹   r¦   r§   rŒ   s       r)   r    r    ó  sW   € ô 
‡HH× Ñ Ð!IÔJÙÜ—‘˜eÓ$ˆØ	‡KK„MÜ˜tÕ$Ù
ˆ5Ð8ÓÜˆE˜4Õ Ø€Lr(   c                 ó¬   — t         j                  j                  d«       |st        j                  | «      } t        | |d||¬«       |rt        | «       | S )ag  Converts submodules in input module to a different module according to `mapping`
    by calling `from_float` method on the target module class. And remove qconfig at the
    end if remove_qconfig is set to True.

    Args:
        `module`: prepared and calibrated module
        `mapping`: a dictionary that maps from source module type to target
                   module type, can be overwritten to allow swapping user defined
                   Modules
        `inplace`: carry out model transformations in-place, the original module
                   is mutated
        `convert_custom_config_dict`: custom configuration dictionary for convert function

    .. code-block:: python

       # Example of convert_custom_config_dict:
       convert_custom_config_dict = {
           # user will manually define the corresponding quantized
           # module class which has a from_observed class method that converts
           # observed custom module to quantized custom module
           "observed_to_quantized_custom_module_class": {
               ObservedCustomModule: QuantizedCustomModule
           }
       }

    z!quantization_api.quantize.convertT)rŒ   Úis_referenceÚconvert_custom_config_dict)r1   rƒ   r„   r…   r†   Ú_convertr¢   )r8   r¨   rŒ   rÁ   rÇ   rÈ   s         r)   r!   r!   	  sN   € ô: 
‡HH× Ñ Ð!DÔEÙÜ—‘˜vÓ&ˆÜØ °LØ#=õ?ñ Ü˜ÔØ€Mr(   c                 óš  — |€|r
t        «       n	t        «       }|€
t        «       }|j                  di «      }|st	        j
                  | «      } i }| j                  «       D ]A  \  }}t        |t        «      st        |«      |vrt        ||d||«       t        |||«      ||<   ŒC |j                  «       D ]  \  }	}
|
| j                  |	<   Œ | S )a  Converts submodules in input module to a different module according to `mapping`
    by calling `from_float` method on the target module class

    Args:
        module: input module
        mapping: a dictionary that maps from source module type to target
                 module type, can be overwritten to allow swapping user defined
                 Modules
        inplace: carry out model transformations in-place, the original module
                 is mutated
        is_reference: a flag to enable quantized reference module

    r$   T)r   r   r   r/   r…   r†   r5   rb   r   r   rÉ   r"   r”   r}   )r8   r¨   rŒ   rÇ   rÈ   ru   Úreassignr?   ÚmodÚkeyÚvalues              r)   rÉ   rÉ   0  sç   € ð  €ÙJVÔDÔFÜ9Ó;ð 	à!Ð)Ü%CÓ%EÐ"Ø"<×"@Ñ"@ÐAlÐnpÓ"qÐáÜ—‘˜vÓ&ˆØ€HØ×*Ñ*Ó,ò P‰	ˆˆcô ˜#œ|Ô,Ü'¨Ó,Ð4OÑOÜS˜' 4Ø!Ð#=ô?ä$ S¨'Ð3NÓOˆŠðPð —n‘nÓ&ò %‰
ˆˆUØ$ˆ‰˜Òð%ð €Mr(   c                 ób  — | }t        | d«      rŸ| j                  ’d}t        | «      |v r |t        | «         j                  | «      }d}nžt        | «      |v r‘|t        | «         }t        |d«      rd|j                  rX| j                  €J ‚| j                  j                  «       } || j
                  «       t        |«      }|j                  | |«      }n|j                  | «      }d}|rÃ| j                  j                  «       D ]  }|j                  |«       Œ | j                  j                  «       D ]  }	|	t        usŒ|j                  |	«       Œ t        | «      }
t        |
«      dk  s
J d|
› «       ‚t        |
«      dkD  rt!        t#        |
«      «      nd}|r|j%                  |«       |S )	a	  Swaps the module if it has a quantized counterpart and it has an
    `observer` attached.

    Args:
        mod: input module
        mapping: a dictionary that maps from nn module to nnq module

    Return:
        The corresponding quantized module of `mod`
    r+   NFTÚ_IS_REFERENCEr   zOswap_module only works with cpu or single-device CUDA modules, but got devices r   )rN   r+   r   Úfrom_observedrÐ   Úweightr   ro   r‘   rÃ   rO   r’   rI   rP   re   rf   rg   rh   rX   )rÌ   r¨   ru   Únew_modÚswappedÚqmodÚweight_post_processÚweight_qparamsÚpre_hook_fnr›   rv   rY   s               r)   r"   r"   X  s¤  € ð €GÜˆsIÕ 3§;¡;Ñ#:ØˆÜ'¨Ó,Ð0KÑKØ1Ô2NÈsÓ2SÑT×bÑbÐcfÓgˆGØ‰GÜ)¨#Ó.°'Ñ9ØÔ7¸Ó<Ñ=ˆDÜt˜_Ô-°$×2DÒ2DØ—{‘{Ð.Ð.Ð.Ø&)§k¡k×&8Ñ&8Ó&:Ð#Ù# C§J¡JÔ/Ü!0Ð1DÓ!EØŸ/™/¨#¨~Ó>‘àŸ/™/¨#Ó.ØˆGáà"×5Ñ5×<Ñ<Ó>ò ?Ø×1Ñ1°+Õ>ð?ð ×-Ñ-×4Ñ4Ó6ò ;ØÔ"8Ò8Ø×1Ñ1°'Õ:ð;ô
 +¨3Ó/ˆGÜw“< 1Ò$ð ØaÐbiÐajÐkóÐ$ô -0°«L¸1Ò,<”Tœ$˜w›-Ô(À$ˆFÙØ—
‘
˜6Ô"Ø€Nr(   c                 óº   — d„ }t        | d«      r| j                  | ||«      dz   <   | j                  «       D ]!  \  }}|r ||«      |z   n|}t        |||«       Œ# y)a,  Traverse the modules and save all observers into dict.
    This is mainly used for quantization accuracy debug
    Args:
        mod: the top module we want to save all observers
        prefix: the prefix for the current module
        target_dict: the dictionary used to save all the observers
    c                 ó   — | dk(  r| S | dz   S )NÚ r,   r'   )r;   s    r)   Ú
get_prefixz&_get_observer_dict.<locals>.get_prefix‘  s   € Ø 2šˆvÐ7¨6°C©<Ð7r(   rE   N)rN   rE   r5   Ú_get_observer_dict)rÌ   Útarget_dictr;   rÜ   r?   r@   rA   s          r)   rÝ   rÝ   ‰  sj   € ò8ô ˆsÐ-Ô.ØFI×FaÑFaˆ‘J˜vÓ&Ð)BÑBÑCØ×)Ñ)Ó+ò >‰ˆˆeÙ5;™
 6Ó*¨TÒ1ÀˆÜ˜5 +¨}Õ=ñ>r(   )NrÛ   N)NNr   )NNNN)FNNN)NF)NFTFN)NFFN)rÛ   )Ar…   r»   r‰   r1   Útorch.nnri   Útorch.ao.nn.quantizedr2   Ú	quantizedrl   Útorch.ao.nn.intrinsicr   Ú+torch.ao.quantization.quantization_mappingsr   r   r   r   r   r	   r
   r   Úutilsr   r   Útorch.ao.quantization.stubsr   r   Útorch.ao.quantization.qconfigr   r   r   r   r   r   Útorch.nn.utils.parametrizer   Útorch.ao.quantization.observerr   Úis_activation_post_processÚ__all__r¬   ÚquantizableÚMultiheadAttentionr&   r   r7   r   rI   rK   rS   rq   re   r   r   rŸ   r¢   r   rª   r   r   r    r!   rÉ   r"   rÝ   r'   r(   r)   ú<module>rí      se  ðÛ Û Û ã Ý ß #Ó #Ý .÷	÷ 	ó 	÷ Nß A÷÷ õ DÝ Fõò€ð 	‰—‘×$Ñ$Ø
×Ñ˜rŸ~™~×@Ñ@ð.ð
 	‰×Ñ˜RŸ\™\×.Ñ.Ø
‰×)Ñ)¨2¯<©<×+JÑ+Jð2ñ	Ð ò'ð Z^ó&óPkò,0ò
2ó


óV/òp-òð, .2Ø*.Ø'+ó6òp!ò,,óð8 *.°U·[±[Ø!¨5óSójó8ð. =AØ7;ó%ðP ',Ø7;ó&òP/ôb>r(   