Ë
    œÐVhÌ  ã                   ó€   — U d dl Z d dlmZ g Zee   ed<    G d„ de j                  j                  j                  «      Z
y)é    N)Ú	ParameterÚ__all__c                   ó6  ‡ — e Zd ZdZ	 	 	 	 	 	 dˆ fd„	Zej                  j                  d„ «       Zej                  j                  d„ «       Z	ej                  j                  d„ «       Z
ej                  j                  dd„«       Zej                  j                  dd„«       Zej                  j                  dd„«       Zej                  j                  dd	„«       Zej                  j                  d
„ «       Zej                  j                  d„ «       Zd„ Zˆ xZS )Ú_LearnableFakeQuantizea  Generalized extension of the FakeQuantize module in fake_quantize.py.

    This is an extension of the FakeQuantize module in fake_quantize.py, which
    supports more generalized lower-bit quantization and supports learning of the scale
    and zero point parameters through backpropagation.

    In addition to the attributes in the original FakeQuantize module, the _LearnableFakeQuantize
    module also includes the following attributes to support quantization parameter learning.

    * :attr:`channel_len` defines the length of the channel when initializing scale and zero point
      for the per channel case.

    * :attr:`use_grad_scaling` defines the flag for whether the gradients for scale and zero point are
      normalized by the constant, which is proportional to the square root of the number of
      elements in the tensor. The related literature justifying the use of this particular constant
      can be found here: https://openreview.net/pdf?id=rkgO66VKDS.

    * :attr:`fake_quant_enabled` defines the flag for enabling fake quantization on the output.

    * :attr:`static_enabled` defines the flag for using observer's static estimation for
      scale and zero point.

    * :attr:`learning_enabled` defines the flag for enabling backpropagation for scale and zero point.
    c                 ób  •— t         ‰
|   «        ||k  sJ d«       ‚|| _        || _        ||d<   ||d<   || _        |dk(  rIt        t        j                  |g«      «      | _        t        t        j                  |g«      «      | _	        njt        |t        «      r|dkD  sJ d«       ‚t        t        j                  |g|z  «      «      | _        t        t        j                  |g|z  «      «      | _	         |di |¤Ž| _        t        j                  | j                  j                  «      j                  |k  sJ d«       ‚|t        j                  | j                  j                  «      j                   k  sJ d«       ‚| j                  j                  | _        | j                  j"                  | _        t%        | j                  d	«      r| j                  j&                  nd| _        | j)                  d
t        j                  dgt        j*                  ¬«      «       | j)                  dt        j                  dgt        j*                  ¬«      «       | j)                  dt        j                  dgt        j*                  ¬«      «       t        j                  ||z
  dz   «      j-                  «       }	t        t        j.                  |	«      j1                  «       «      | _        | j)                  dt        j                  t        j4                  t        j6                  «      j8                  g«      «       y )Nz/quant_min must be strictly less than quant_max.Ú	quant_minÚ	quant_maxéÿÿÿÿr   z(Channel size must be a positive integer.zquant_min out of boundzquant_max out of boundÚch_axisÚfake_quant_enabledé   )ÚdtypeÚstatic_enabledÚlearning_enabledÚeps© )ÚsuperÚ__init__r   r	   Úuse_grad_scalingr   ÚtorchÚtensorÚscaleÚ
zero_pointÚ
isinstanceÚintÚactivation_post_processÚiinfor   ÚminÚmaxÚqschemeÚhasattrr   Úregister_bufferÚuint8ÚdoubleÚlog2ÚitemÚbitwidthÚfinfoÚfloat32r   )ÚselfÚobserverr   r	   r   r   Úchannel_lenr   Úobserver_kwargsÚbitrangeÚ	__class__s             €ú^/home/dcms/DCMS/lib/python3.12/site-packages/torch/ao/quantization/_learnable_fake_quantize.pyr   z_LearnableFakeQuantize.__init__$   s  ø€ ô 	‰ÑÔØ˜9Ò$ÐWÐ&WÓWÐ$Ø"ˆŒØ"ˆŒà'0ˆ˜Ñ$Ø'0ˆ˜Ñ$Ø 0ˆÔØ˜"ÒÜ"¤5§<¡<°°Ó#8Ó9ˆDŒJÜ'¬¯©°j°\Ó(BÓCˆDOô ˜;¬Ô,°¸q²ð:à9ó:Ø@ä"¤5§<¡<°°¸+Ñ0EÓ#FÓGˆDŒJÜ'¬¯©°j°\ÀKÑ5OÓ(PÓQˆDŒOá'/Ñ'B°/Ñ'BˆÔ$äK‰K˜×4Ñ4×:Ñ:Ó;×?Ñ?À9ÒLð	$à#ó	$ØLð œŸ™ T×%AÑ%A×%GÑ%GÓH×LÑLÒLð	$à#ó	$ØLà×1Ñ1×7Ñ7ˆŒ
Ø×3Ñ3×;Ñ;ˆŒô t×3Ñ3°YÔ?ð ×(Ñ(×0Ò0àð 	Œð
 	×ÑÐ1´5·<±<ÀÀÌ5Ï;É;Ô3WÔXØ×ÑÐ-¬u¯|©|¸Q¸CÄuÇ{Á{Ô/SÔTØ×ÑÐ/´·±¸q¸cÌÏÉÔ1UÔVä—<‘< 	¨IÑ 5¸Ñ 9Ó:×AÑAÓCˆÜœEŸJ™J xÓ0×5Ñ5Ó7Ó8ˆŒØ×Ñ˜U¤E§L¡L´%·+±+¼e¿m¹mÓ2L×2PÑ2PÐ1QÓ$RÕSó    c                 ój   — | j                  d¬«      j                  d¬«      j                  d¬«       | S )zÎEnable parameter learning over static observer estimates.

        Enables learning of quantization parameters and
        disables static observer estimates. Forward path returns fake quantized X.
        T©ÚenabledF©Útoggle_qparam_learningÚtoggle_fake_quantÚtoggle_observer_update©r*   s    r0   Úenable_param_learningz,_LearnableFakeQuantize.enable_param_learningW   s<   € ð 	×#Ñ#¨DÐ#Ó1×CÑCØð 	Dó 	
ç
 Ñ
 ¨Ð
 Ô
/Øˆr1   c                 óh   — | j                  d¬«      j                  d¬«      j                  d¬«       y)zÈEnable static estimates of quantization parameters.

        Enables static observer estimates and disables learning of
        quantization parameters. Forward path returns fake quantized X.
        Fr3   TNr5   r9   s    r0   Úenable_static_estimatez-_LearnableFakeQuantize.enable_static_estimatec   s7   € ð 	×#Ñ#¨EÐ#Ó2×DÑDØð 	Eó 	
ç
 Ñ
 ¨Ð
 Õ
.r1   c                 óh   — | j                  d¬«      j                  d¬«      j                  d¬«       y)zéEnable accumulation of data without updating quantization parameters.

        Enables static observer accumulating data from input but doesn't
        update the quantization parameters. Forward path returns the original X.
        Fr3   TNr5   r9   s    r0   Úenable_static_observationz0_LearnableFakeQuantize.enable_static_observationn   s7   € ð 	×#Ñ#¨EÐ#Ó2×DÑDØð 	Eó 	
ç
 Ñ
 ¨Ð
 Õ
.r1   c                 ó6   — t        |«      | j                  d<   | S ©Nr   )r   r   ©r*   r4   s     r0   r8   z-_LearnableFakeQuantize.toggle_observer_updatey   s   € ä!$ W£ˆ×Ñ˜AÑØˆr1   c                 ó&   — | j                  |«       y )N)r8   rA   s     r0   Úenable_observerz&_LearnableFakeQuantize.enable_observer~   s   € à×#Ñ# GÕ,r1   c                 óz   — t        |«      | j                  d<   || j                  _        || j                  _        | S r@   )r   r   r   Úrequires_gradr   rA   s     r0   r6   z-_LearnableFakeQuantize.toggle_qparam_learning‚   s3   € ä#& w£<ˆ×Ñ˜aÑ Ø#*ˆ
‰
Ô Ø(/ˆ‰Ô%Øˆr1   c                 ó6   — t        |«      | j                  d<   | S r@   )r   r   rA   s     r0   r7   z(_LearnableFakeQuantize.toggle_fake_quant‰   s   € ä%(¨£\ˆ×Ñ Ñ"Øˆr1   c                 óœ   — t        d| j                  j                  «       › «       t        d| j                  j                  «       › «       y )Nz_LearnableFakeQuantize Scale: z#_LearnableFakeQuantize Zero Point: )Úprintr   Údetachr   r9   s    r0   Úobserve_quant_paramsz+_LearnableFakeQuantize.observe_quant_paramsŽ   s>   € äÐ.¨t¯z©z×/@Ñ/@Ó/BÐ.CÐDÔEÜÐ3°D·O±O×4JÑ4JÓ4LÐ3MÐNÕOr1   c                 ón  — | j                   j                  j                  | j                  j	                  «       ¬«       | j                   j                  «       }| j                  j                  «       j                  «       j                  | j                  | j                  «      j                  «       }||fS )N©r   )r   ÚdataÚclamp_r   r&   rI   r   ÚroundÚclampr   r	   Úlong)r*   r   r   s      r0   Úcalculate_qparamsz(_LearnableFakeQuantize.calculate_qparams“   s{   € à
‰
‰×Ñ 4§8¡8§=¡=£?ÐÔ3Ø—
‘
×!Ñ!Ó#ˆàO‰O×"Ñ"Ó$ß‰U‹Wß‰U4—>‘> 4§>¡>Ó2ß‰T‹Vð	 	ð jÐ Ð r1   c           	      óì  — | j                   d   dk(  rÑ| j                  |j                  «       «       | j                  j                  «       \  }}|j	                  | j
                  j                  «      }|j	                  | j                  j                  «      }| j
                  j                  j                  |«       | j                  j                  j                  |«       n>| j
                  j                  j                  | j                  j                  «       ¬«       | j                  d   dk(  r?| j                  t        j                   t        j"                  fv r$| j                  j                  j%                  «        | j&                  r$d|j)                  «       | j*                  z  dz  z  }nd}| j                  t        j                   t        j,                  fv rOt        j.                  || j
                  | j                  | j0                  | j2                  | j*                  |«      }|S t        j4                  || j
                  | j                  | j2                  | j*                  |«      }|S )Nr   r   rL   ç      ð?g      à?)r   r   rI   rR   Útor   Údevicer   rM   Úcopy_rN   r   r&   r   r    r   Úper_channel_symmetricÚper_tensor_symmetricÚzero_r   Únumelr	   Úper_channel_affineÚ+_fake_quantize_learnable_per_channel_affiner   r   Ú*_fake_quantize_learnable_per_tensor_affine)r*   ÚXÚ_scaleÚ_zero_pointÚgrad_factors        r0   Úforwardz_LearnableFakeQuantize.forwardŸ   sÕ  € Ø×Ñ˜qÑ! QÒ&Ø×(Ñ(¨¯©«Ô4Ø"&×">Ñ">×"PÑ"PÓ"RÑˆFKØ—Y‘Y˜tŸz™z×0Ñ0Ó1ˆFØ%Ÿ.™.¨¯©×)?Ñ)?Ó@ˆKØJ‰JO‰O×!Ñ! &Ô)ØO‰O× Ñ ×&Ñ& {Õ3àJ‰JO‰O×"Ñ" t§x¡x§}¡}£Ð"Ô7à×"Ñ" 1Ñ%¨Ó*Ø|‰|Ü×+Ñ+Ü×*Ñ*ð ñ ð —‘×$Ñ$×*Ñ*Ô,à×$Ò$Ø! Q§W¡W£Y°·±Ñ%?ÀCÑ$GÑG‘à!Ø|‰|¤× ;Ñ ;¼U×=UÑ=UÐVÑVÜ×EÑEØØ—J‘JØ—O‘OØ—L‘LØ—N‘NØ—N‘NØóð& ˆô ×DÑDØØ—J‘JØ—O‘OØ—N‘NØ—N‘NØóð ˆr1   )r   éÿ   rT   g        r
   F)T)Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   r   ÚjitÚexportr:   r<   r>   r8   rC   r6   r7   rJ   rR   rc   Ú__classcell__)r/   s   @r0   r   r   
   s8  ø„ ñð8 ØØØØØõ1Tðf ‡YY×Ññ	ó ð	ð ‡YY×Ññ/ó ð/ð ‡YY×Ññ/ó ð/ð ‡YY×Ñòó ðð ‡YY×Ñò-ó ð-ð ‡YY×Ñòó ðð ‡YY×Ñòó ðð ‡YY×ÑñPó ðPð ‡YY×Ññ	!ó ð	!ö*r1   r   )r   Útorch.nn.parameterr   r   ÚlistÚstrÚ__annotations__ÚaoÚquantizationÚFakeQuantizeBaser   r   r1   r0   ú<module>rs      s;   ðô Ý (ð €ˆˆc‰Ó ô˜UŸX™X×2Ñ2×CÑCõ r1   