U
    <ºct  ã                   @   s¼  d dl Z d dlZd dlmZ d dlm  m  mZ d dlm  m  m	Z
 d dlm  mZ d dlmZ d dlmZ d dlmZmZmZ d dlmZ d dlmZ ddd	d
dddddddgZejejejdœZedejjj dZ!G dd„ dejjj ej"ƒZ#G dd„ de#ej$ƒZ%G dd„ de%ƒZ&G dd	„ d	e
j$ej"ƒZ'G dd
„ d
e#ej(ƒZ)G dd„ de)ƒZ*G dd„ de
j(ej"ƒZ+G dd„ de#ej,ƒZ-G dd„ de-ƒZ.G dd„ de
j,ej"ƒZ/d d„ Z0d!d„ Z1dS )"é    N)Úinit)Úfuse_conv_bn_weights)Ú_singleÚ_pairÚ_triple)Ú	Parameter)ÚTypeVarÚConvBn1dÚConvBnReLU1dÚ
ConvReLU1dÚConvBn2dÚConvBnReLU2dÚ
ConvReLU2dÚConvBn3dÚConvBnReLU3dÚ
ConvReLU3dÚupdate_bn_statsÚfreeze_bn_stats)é   é   é   ÚMOD)Úboundc                       s¤   e Zd ZdZeZd%dd„Zdd	„ Zd
d„ Z‡ fdd„Z	dd„ Z
dd„ Zdd„ Zdd„ Zdd„ Z‡ fdd„Zdd„ Zd&dd„Z‡ fdd „Zed!d"„ ƒZd#d$„ Z‡  ZS )'Ú	_ConvBnNdr   çñhãˆµøä>çš™™™™™¹?FNc                 C   sÄ   t jjj | |||||||||	d|¡ |s2tdƒ‚|| _| jrB|nd| _t	| |||ddƒ| _
| j ¡ | _|
r€tt |¡ƒ| _n|  dd ¡ |  ¡  | jr²|r¨|  ¡  qº|  ¡  n|  ¡  d| _d S )NFú'qconfig must be provided for QAT moduleTÚbias)ÚnnÚmodulesÚconvÚ_ConvNdÚ__init__ÚAssertionErrorÚqconfigÚtrainingÚ	freeze_bnÚ_BN_CLASS_MAPÚbnÚweightÚweight_fake_quantr   ÚtorchÚemptyr   Zregister_parameterÚreset_bn_parametersr   r   Ú0_enable_slow_path_for_better_numerical_stability)ÚselfÚin_channelsÚout_channelsÚkernel_sizeÚstrideÚpaddingÚdilationZ
transposedZoutput_paddingÚgroupsr   Úpadding_modeÚepsÚmomentumr&   r$   Údim© r;   úM/tmp/pip-unpacked-wheel-gikjz4vx/torch/nn/intrinsic/qat/modules/conv_fused.pyr"      s2          þ

z_ConvBnNd.__init__c                 C   s   | j  ¡  d S ©N)r(   Úreset_running_stats©r/   r;   r;   r<   r>   H   s    z_ConvBnNd.reset_running_statsc                 C   sd   | j  ¡  t | j j¡ t | j j¡ | jd k	r`t | j¡\}}dt 	|¡ }t | j| |¡ d S )Nr   )
r(   r>   r   Zuniform_r)   Zzeros_r   Z_calculate_fan_in_and_fan_outÚmathÚsqrt)r/   Zfan_inÚ_r   r;   r;   r<   r-   K   s    

z_ConvBnNd.reset_bn_parametersc                    s   t t| ƒ ¡  d S r=   )Úsuperr   Úreset_parametersr?   ©Ú	__class__r;   r<   rD   U   s    z_ConvBnNd.reset_parametersc                 C   s   d| _ d| j_| S )NFT©r&   r(   r%   r?   r;   r;   r<   r   X   s    z_ConvBnNd.update_bn_statsc                 C   s   d| _ d| j_| S )NTFrG   r?   r;   r;   r<   r   ]   s    z_ConvBnNd.freeze_bn_statsc                 C   s   | j r|  |¡S |  |¡S r=   )r.   Ú_forward_slowÚ_forward_approximate©r/   Úinputr;   r;   r<   Ú_forwardb   s    
z_ConvBnNd._forwardc           
      C   sô   | j jdk	st‚t | j j| j j ¡}| j j| }dgt| jjƒ }d|d< dgt| jjƒ }d|d< |  	| j| 
|¡ ¡}| jdk	rštj| j|jd}ntj| j|j|jd}|  |||¡}|| 
|¡ }	| jdk	ræ|	| j 
|¡ }	|   |	¡}|S )z©Approximated method to fuse conv and bn. It requires only one forward pass.
        conv_orig = conv / scale_factor where scale_factor = bn.weight / running_std
        Nr   éÿÿÿÿr   )Údtype©ÚdevicerN   )r(   Úrunning_varr#   r+   rA   r8   r)   ÚlenÚshaper*   Úreshaper   Z
zeros_likerN   Úzerosr1   rP   Ú_conv_forward)
r/   rK   Úrunning_stdÚscale_factorÚweight_shapeÚ
bias_shapeÚscaled_weightÚ	zero_biasr    Z	conv_origr;   r;   r<   rI   g   s"    


z_ConvBnNd._forward_approximatec              	   C   sð  | j jdk	st‚| j jdk	s t‚tj| j| jj|j	d}dgt
| jjƒ }d|d< dgt
| jjƒ }d|d< | j jrÀ|  || j|¡}t ¡ . | jdkrœ|n|| j |¡ }|   |¡ W 5 Q R X t | j j| j j ¡}| j j| }|  | j| |¡ ¡}	|  ||	|¡}
| j jr‚dgttdt
| jjƒƒƒ }| |¡}t || |¡ ¡ |¡}t || j j ¡}|| }|
| |¡9 }
|}|}n"| j j| jdk	rš| jnd }|}| j j| j j| |  }|
| |¡7 }
| jdk	rì|
| j| j  |¡7 }
|
S )aH  
        A more accurate but slow method to compute conv bn fusion, following https://arxiv.org/pdf/1806.08342.pdf
        It requires two forward passes but handles the case bn.weight == 0

        Conv: Y = WX + B_c
        Conv without bias: Y0 = WX = Y - B_c, Y = Y0 + B_c

        Batch statistics:
          mean_Y = Y.mean()
                 = Y0.mean() + B_c
          var_Y = (Y - mean_Y)^2.mean()
                = (Y0 - Y0.mean())^2.mean()
        BN (r: bn.weight, beta: bn.bias):
          Z = r * (Y - mean_Y) / sqrt(var_Y + eps) + beta
            = r * (Y0 - Y0.mean()) / sqrt(var_Y + eps) + beta

        Fused Conv BN training (std_Y = sqrt(var_Y + eps)):
          Z = (r * W / std_Y) * X + r * (B_c - mean_Y) / std_Y + beta
            = (r * W / std_Y) * X - r * Y0.mean() / std_Y + beta

        Fused Conv BN inference (running_std = sqrt(running_var + eps)):
          Z = (r * W / running_std) * X - r * (running_mean - B_c) / running_std + beta

        QAT with fused conv bn:
          Z_train = fake_quant(r * W / running_std) * X * (running_std / std_Y) - r * Y0.mean() / std_Y + beta
                  = conv(X, fake_quant(r * W / running_std)) * (running_std / std_Y) - r * Y0.mean() / std_Y + beta
          Z_inference = conv(X, fake_quant(r * W / running_std)) - r * (running_mean - B_c) / running_std + beta
        NrO   r   rM   r   r   )r(   rQ   r#   Úrunning_meanr+   rU   r1   r)   rP   rN   rR   rS   r%   rV   Zno_gradr   rT   rA   r8   r*   ÚlistÚrangeZmeanZsquare)r/   rK   r\   rY   rZ   Zconv_outZconv_out_biasrW   rX   r[   Zconv_bnZavg_dimsZ
batch_meanZ	batch_varZ	batch_stdZunscale_factorZ
fused_meanZ	fused_stdZ
fused_biasr;   r;   r<   rH   €   sJ    
ÿÿ

ÿz_ConvBnNd._forward_slowc                    s   t t| ƒ ¡ S r=   )rC   r   Ú
extra_reprr?   rE   r;   r<   r`   Û   s    z_ConvBnNd.extra_reprc                 C   s
   |   |¡S r=   )rL   rJ   r;   r;   r<   Úforwardß   s    z_ConvBnNd.forwardTc                 C   s(   || _ | js$|  ¡ D ]}| |¡ q| S )zä
        Batchnorm's training behavior is using the self.training flag. Prevent
        changing it if BN is frozen. This makes sure that calling `model.train()`
        on a model with a frozen BN will behave properly.
        )r%   r&   ÚchildrenÚtrain)r/   ÚmodeÚmoduler;   r;   r<   rc   â   s
    z_ConvBnNd.trainc              	      s®   |  dd ¡}|d ks|dkrŽddddddœ}	|	 ¡ D ]X\}
}|| |krl|||  |||
 < | || ¡ q4||
 |krzq4|r4| ||
 ¡ q4tt| ƒ |||||||¡ d S )	NÚversionr   ÚgammaÚbetar]   rQ   Únum_batches_tracked)z	bn.weightzbn.biaszbn.running_meanzbn.running_varzbn.num_batches_tracked)ÚgetÚitemsÚpopÚappendrC   r   Ú_load_from_state_dict)r/   Z
state_dictÚprefixZlocal_metadataÚstrictZmissing_keysZunexpected_keysZ
error_msgsrf   Zv2_to_v1_namesZv2_nameZv1_namerE   r;   r<   rn     s2    û	
      ÿz_ConvBnNd._load_from_state_dictc                 C   sà   t |ƒ| jks(td| j d | jj ƒ‚t|dƒs:tdƒ‚|jsHtdƒ‚|j}|d |d  }}| |j|j|j|j	|j
|j|j|jdk	|j|j|jd	|ƒ}|j|_|j|_|j|j_|j|j_|j|j_|j|j_|j|j_|S )
z¾Create a qat module from a float module or qparams_dict

            Args: `mod` a float module, either produced by torch.ao.quantization utilities
            or directly from user
        zqat.z.from_float only works for r$   z,Input float module must have qconfig definedz,Input float module must have a valid qconfigr   r   NF)ÚtypeÚ_FLOAT_MODULEr#   Ú__name__Úhasattrr$   r0   r1   r2   r3   r4   r5   r6   r   r7   r8   r9   r)   r(   r]   rQ   ri   )ÚclsÚmodr$   r    r(   Z
qat_convbnr;   r;   r<   Ú
from_float#  s6    	ÿ    ú


z_ConvBnNd.from_floatc                 C   sø   t | ƒ}| | j| j| j| j| j| j| j| j	d k	| j
¡	}tj | j ¡ ¡|_| j	d k	rjtj | j	 ¡ ¡|_	|jr¤t|j|j	| jj| jj| jj| jj| jj	ƒ\|_|_	|jräg }| |¡ | ¡ }| |¡ |j|Ž }| | j¡ |S | | j¡ |S d S r=   )rq   Ú_FLOAT_CONV_MODULEr0   r1   r2   r3   r4   r5   r6   r   r7   r+   r   r   r)   ÚdetachÚ_FLOAT_BN_MODULEr   r(   r]   rQ   r8   Ú_FLOAT_RELU_MODULErm   Ú_FUSED_FLOAT_MODULErc   r%   )r/   ru   r    r   ÚreluZ	conv_relur;   r;   r<   Úto_floatC  sF    ÷

ù



z_ConvBnNd.to_float)r   r   FNr   )T)rs   Ú
__module__Ú__qualname__Ú_versionr   rr   r"   r>   r-   rD   r   r   rL   rI   rH   r`   ra   rc   rn   Úclassmethodrw   r~   Ú__classcell__r;   r;   rE   r<   r      s.         ñ
*
[
"
r   c                
   @   s0   e Zd ZdZejZdZej	Z
ejZdd	d
„ZdS )r	   aÅ  
    A ConvBn1d module is a module fused from Conv1d and BatchNorm1d,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv1d` and
    :class:`torch.nn.BatchNorm1d`.

    Similar to :class:`torch.nn.Conv1d`, with FakeQuantize modules initialized
    to default.

    Attributes:
        freeze_bn:
        weight_fake_quant: fake quant module for weight

    Nr   r   rU   r   r   Fc                 C   sT   t |ƒ}t |ƒ}t |ƒ}t |ƒ}tj| ||||||dt dƒ|||	|
|||dd d S )NFr   r   ©r:   )r   r   r"   ©r/   r0   r1   r2   r3   r4   r5   r6   r   r7   r8   r9   r&   r$   r;   r;   r<   r"     s$              þzConvBn1d.__init__)
r   r   r   r   NrU   r   r   FN)rs   r   r€   Ú__doc__r   ÚBatchNorm1drz   r{   Únnir	   rr   ÚConv1drx   r"   r;   r;   r;   r<   r	   k  s                 óc                
       sX   e Zd ZdZejZejZ	ej
ZejZejZd‡ fd	d
„	Zdd„ Ze‡ fdd„ƒZ‡  ZS )r
   aÐ  
    A ConvBnReLU1d module is a module fused from Conv1d, BatchNorm1d and ReLU,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv1d` and
    :class:`torch.nn.BatchNorm1d` and :class:`torch.nn.ReLU`.

    Similar to `torch.nn.Conv1d`, with FakeQuantize modules initialized to
    default.

    Attributes:
        weight_fake_quant: fake quant module for weight

    r   r   NrU   r   r   Fc                    s(   t ƒ  |||||||||	|
|||¡ d S r=   )rC   r"   r…   rE   r;   r<   r"   ¯  s         üzConvBnReLU1d.__init__c                 C   s   t  t | |¡¡S r=   )ÚFr}   r	   rL   rJ   r;   r;   r<   ra   Ã  s    zConvBnReLU1d.forwardc                    s   t t| ƒ |¡S r=   )rC   r
   rw   ©ru   rv   rE   r;   r<   rw   Æ  s    zConvBnReLU1d.from_float)
r   r   r   r   NrU   r   r   FN)rs   r   r€   r†   rˆ   r
   rr   r   r‰   rx   r‡   rz   ÚReLUr{   r   r|   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r
   —  s(                óc                       sP   e Zd ZdZejZejZ	dZ
ejZd‡ fdd„	Zd	d
„ Ze‡ fdd„ƒZ‡  ZS )r   aC  A ConvReLU1d module is a fused module of Conv1d and ReLU, attached with
    FakeQuantize modules for weight for
    quantization aware training.

    We combined the interface of :class:`~torch.nn.Conv1d` and
    :class:`~torch.nn.BatchNorm1d`.

    Attributes:
        weight_fake_quant: fake quant module for weight

    Nr   r   TrU   c                    sF   t t| ƒj|||||||||	|
d
 |
s0tdƒ‚|
| _| j ¡ | _d S ©N)r3   r4   r5   r6   r   r7   r$   r   )rC   r   r"   r#   r$   r)   r*   ©r/   r0   r1   r2   r3   r4   r5   r6   r   r7   r$   rE   r;   r<   r"   Û  s        ýzConvReLU1d.__init__c                 C   s   t  |  ||  | j¡| j¡¡S r=   ©rŠ   r}   rV   r*   r)   r   rJ   r;   r;   r<   ra   ç  s    ÿzConvReLU1d.forwardc                    s   t t| ƒ |¡S r=   )rC   r   rw   r‹   rE   r;   r<   rw   ë  s    zConvReLU1d.from_float)r   r   r   r   TrU   N)rs   r   r€   r†   rˆ   r   rr   r   r‰   rx   rz   rŒ   r{   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r   Ê  s              ýc                
   @   s0   e Zd ZdZejZejZ	ej
ZdZdd	d
„ZdS )r   aÅ  
    A ConvBn2d module is a module fused from Conv2d and BatchNorm2d,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv2d` and
    :class:`torch.nn.BatchNorm2d`.

    Similar to :class:`torch.nn.Conv2d`, with FakeQuantize modules initialized
    to default.

    Attributes:
        freeze_bn:
        weight_fake_quant: fake quant module for weight

    Nr   r   rU   r   r   Fc                 C   sT   t |ƒ}t |ƒ}t |ƒ}t |ƒ}tj| ||||||dt dƒ|||	|
|||dd d S )NFr   r   r„   )r   r   r"   r…   r;   r;   r<   r"     s$              þzConvBn2d.__init__)
r   r   r   r   NrU   r   r   FN)rs   r   r€   r†   rˆ   r   rr   r   ÚConv2drx   ÚBatchNorm2drz   r{   r"   r;   r;   r;   r<   r   ï  s                 óc                
       sX   e Zd ZdZejZejZ	ej
ZejZejZd‡ fd	d
„	Zdd„ Ze‡ fdd„ƒZ‡  ZS )r   aÐ  
    A ConvBnReLU2d module is a module fused from Conv2d, BatchNorm2d and ReLU,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv2d` and
    :class:`torch.nn.BatchNorm2d` and :class:`torch.nn.ReLU`.

    Similar to `torch.nn.Conv2d`, with FakeQuantize modules initialized to
    default.

    Attributes:
        weight_fake_quant: fake quant module for weight

    r   r   NrU   r   r   Fc                    s,   t t| ƒ |||||||||	|
|||¡ d S r=   )rC   r   r"   r…   rE   r;   r<   r"   3  s         üzConvBnReLU2d.__init__c                 C   s   t  t | |¡¡S r=   )rŠ   r}   r   rL   rJ   r;   r;   r<   ra   G  s    zConvBnReLU2d.forwardc                    s   t t| ƒ |¡S r=   )rC   r   rw   r‹   rE   r;   r<   rw   J  s    zConvBnReLU2d.from_float)
r   r   r   r   NrU   r   r   FN)rs   r   r€   r†   rˆ   r   rr   r   r   rx   r‘   rz   rŒ   r{   r   r|   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r     s(                óc                       sP   e Zd ZdZejZejZ	dZ
ejZd‡ fdd„	Zd	d
„ Ze‡ fdd„ƒZ‡  ZS )r   aC  A ConvReLU2d module is a fused module of Conv2d and ReLU, attached with
    FakeQuantize modules for weight for
    quantization aware training.

    We combined the interface of :class:`~torch.nn.Conv2d` and
    :class:`~torch.nn.BatchNorm2d`.

    Attributes:
        weight_fake_quant: fake quant module for weight

    Nr   r   TrU   c                    sF   t t| ƒj|||||||||	|
d
 |
s0tdƒ‚|
| _| j ¡ | _d S r   )rC   r   r"   r#   r$   r)   r*   rŽ   rE   r;   r<   r"   _  s        ýzConvReLU2d.__init__c                 C   s   t  |  ||  | j¡| j¡¡S r=   r   rJ   r;   r;   r<   ra   k  s    ÿzConvReLU2d.forwardc                    s   t t| ƒ |¡S r=   )rC   r   rw   r‹   rE   r;   r<   rw   o  s    zConvReLU2d.from_float)r   r   r   r   TrU   N)rs   r   r€   r†   rˆ   r   rr   r   r   rx   rz   rŒ   r{   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r   N  s              ýc                
   @   s0   e Zd ZdZejZejZ	ej
ZdZdd	d
„ZdS )r   aÅ  
    A ConvBn3d module is a module fused from Conv3d and BatchNorm3d,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv3d` and
    :class:`torch.nn.BatchNorm3d`.

    Similar to :class:`torch.nn.Conv3d`, with FakeQuantize modules initialized
    to default.

    Attributes:
        freeze_bn:
        weight_fake_quant: fake quant module for weight

    Nr   r   rU   r   r   Fc                 C   sT   t |ƒ}t |ƒ}t |ƒ}t |ƒ}tj| ||||||dt dƒ|||	|
|||dd d S )NFr   r   r„   )r   r   r"   r…   r;   r;   r<   r"   ‰  s.    ïzConvBn3d.__init__)
r   r   r   r   NrU   r   r   FN)rs   r   r€   r†   rˆ   r   rr   r   ÚConv3drx   ÚBatchNorm3drz   r{   r"   r;   r;   r;   r<   r   s  s              ìc                
       sX   e Zd ZdZejZejZ	ej
ZejZejZd‡ fd	d
„	Zdd„ Ze‡ fdd„ƒZ‡  ZS )r   aÐ  
    A ConvBnReLU3d module is a module fused from Conv3d, BatchNorm3d and ReLU,
    attached with FakeQuantize modules for weight,
    used in quantization aware training.

    We combined the interface of :class:`torch.nn.Conv3d` and
    :class:`torch.nn.BatchNorm3d` and :class:`torch.nn.ReLU`.

    Similar to `torch.nn.Conv3d`, with FakeQuantize modules initialized to
    default.

    Attributes:
        weight_fake_quant: fake quant module for weight

    r   r   NrU   r   r   Fc                    s,   t t| ƒ |||||||||	|
|||¡ d S r=   )rC   r   r"   r…   rE   r;   r<   r"   Î  s    
ózConvBnReLU3d.__init__c                 C   s   t  t | |¡¡S r=   )rŠ   r}   r   rL   rJ   r;   r;   r<   ra   ô  s    zConvBnReLU3d.forwardc                    s   t t| ƒ |¡S r=   )rC   r   rw   r‹   rE   r;   r<   rw   ÷  s    zConvBnReLU3d.from_float)
r   r   r   r   NrU   r   r   FN)rs   r   r€   r†   rˆ   r   rr   r   r’   rx   r“   rz   rŒ   r{   r   r|   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r   ·  s(             ì&c                       sP   e Zd ZdZejZejZ	dZ
ejZd‡ fdd„	Zd	d
„ Ze‡ fdd„ƒZ‡  ZS )r   aC  A ConvReLU3d module is a fused module of Conv3d and ReLU, attached with
    FakeQuantize modules for weight for
    quantization aware training.

    We combined the interface of :class:`~torch.nn.Conv3d` and
    :class:`~torch.nn.BatchNorm3d`.

    Attributes:
        weight_fake_quant: fake quant module for weight

    Nr   r   TrU   c                    sF   t t| ƒj|||||||||	|
d
 |
s0tdƒ‚|
| _| j ¡ | _d S r   )rC   r   r"   r#   r$   r)   r*   rŽ   rE   r;   r<   r"     s    
özConvReLU3d.__init__c                 C   s   t  |  ||  | j¡| j¡¡S r=   r   rJ   r;   r;   r<   ra   )  s    ÿzConvReLU3d.forwardc                    s   t t| ƒ |¡S r=   )rC   r   rw   r‹   rE   r;   r<   rw   .  s    zConvReLU3d.from_float)r   r   r   r   TrU   N)rs   r   r€   r†   rˆ   r   rr   r   r’   rx   rz   rŒ   r{   r"   ra   r‚   rw   rƒ   r;   r;   rE   r<   r   û  s           õc                 C   s(   t | ƒtttttttgƒkr$|  ¡  d S r=   )	rq   Úsetr
   r   r   r	   r   r   r   ©rv   r;   r;   r<   r   2  s    ÿc                 C   s(   t | ƒtttttttgƒkr$|  ¡  d S r=   )	rq   r”   r
   r   r   r	   r   r   r   r•   r;   r;   r<   r   8  s    ÿ)2r@   r+   Ztorch.nnr   Ztorch.ao.nn.intrinsicZaoZ	intrinsicrˆ   Ztorch.ao.nn.qatZqatZnnqatZtorch.nn.functionalZ
functionalrŠ   r   Ztorch.nn.utilsr   Ztorch.nn.modules.utilsr   r   r   Ztorch.nn.parameterr   Útypingr   Ú__all__r‡   r‘   r“   r'   r   r    r!   r   Z_FusedModuler   r‰   r	   r
   r   r   r   r   r   r’   r   r   r   r   r   r;   r;   r;   r<   Ú<module>   sF      ÿý  T,3%,3%DD7