U KºcmPã @s<ddlZddlZddlZddlmZddlmmmZddl m mmZejjZ ddlmZmZmZmZmZmZmZddlmZddlmZddlmZmZddlmZddlm Z dd l!m"Z"m#Z#Gd d„dej$ƒZ%eeeee&ee"fee%e%fdœd d„Z'eeee&ee"feeeej(e)feej(e*ffdœdd„Z+eeedœdd„Z,eee*dœdd„Z-eee*dœdd„Z.eee&dœdd„Z/e#e&e#dœdd„Z0e#ddœd d!„Z1d"d#„Z2e2ej(ej(ej(d$œd%d&„ƒZ3e2ej(ej(ej(d$œd'd(„ƒZ4e2ej(ej(ej(d$œd)d*„ƒZ5ee6dœd+d,„Z7eee*ed-œd.d/„Z8dS)0éN)ÚTupleÚCallableÚDictÚSetÚListÚOptionalÚUnion)ÚGraphModule)ÚNode)ÚObserverBaseÚFakeQuantizeBase)Úgetattr_from_fqn)Úis_activation_post_processé)ÚNSNodeTargetTypeÚ NSResultsTypec@s4eZdZe ¡Ze ¡Ze ¡Ze ¡Ze ¡Z dS)ÚNodeInputOrOutputTypeN) Ú__name__Ú __module__Ú__qualname__ÚenumÚautoÚFP32ÚINT8ÚFP16ÚUNKNOWNZFP32_OR_INT8©rrú8/tmp/pip-unpacked-wheel-gikjz4vx/torch/ao/ns/fx/utils.pyrs r)ÚnodeÚgmÚ logger_clsÚnode_type_to_io_type_mapÚreturncsî|d}|d}|d}|d}|d}|d} |d} |d}|jd krÚ|j|kr`tjtjfS|j|krvtjtjfS|j|krŒtjtjfS|j|krÊt||d ƒ}t|tƒs°t ‚t ||||ƒ\} }||fStjtjfSn|jdkrÖ|jdksôt ‚t|jtƒst ‚t ||jƒ‰t‡fdd „| Dƒƒ}tˆ|ttfƒs@|rvt||d ƒ}t|tƒs\t ‚t ||||ƒ\} }||fSt‡fdd „|Dƒƒ}t‡fdd „| Dƒƒ}|r´tjtjfS|rÆtjtjfStjtjfSn|jdkrÞ|jdkr&t||d ƒ}t|tƒs t ‚t ||||ƒ\} }|tjfS|jdkrt||d ƒ}t|tƒsNt ‚t ||||ƒ\} }t||dƒ}|tjks†t |›dƒ‚|tjfS|j|krÒt||d ƒ}t|tƒs¸t ‚t ||||ƒ\} }||fStjtjfStjtjfSdS)NZfuns_io_type_fp32Zfuns_io_type_fp16Zfuns_io_type_int8Zfuns_io_type_fp32_or_int8Zmods_io_type_fp32Zmods_io_type_int8Úmods_io_type_fp32_or_int8Zmeths_io_type_fp32_or_int8Ú call_functionrÚcall_modulec3s|]}tˆ|ƒVqdS©N©Ú isinstance©Ú.0Útarget_type©ÚmodrrÚ Osz7get_node_first_input_and_output_type..c3s|]}tˆ|ƒVqdSr&r'r)r,rrr.asc3s|]}tˆ|ƒVqdSr&r'r)r,rrr.dsÚcall_methodÚ dequantizeÚtorz handling needs to be added)ÚopÚtargetrrrrÚget_normalized_nth_inputr(r ÚAssertionErrorÚ$get_node_first_input_and_output_typerÚstrr ÚanyrrÚtorchZfloat16)rrr r!ZFUNS_IO_TYPE_FP32ZFUNS_IO_TYPE_FP16ZFUNS_IO_TYPE_INT8ZFUNS_IO_TYPE_FP32_OR_INT8ZMODS_IO_TYPE_FP32ZMODS_IO_TYPE_INT8ÚMODS_IO_TYPE_FP32_OR_INT8ZMETHS_IO_TYPE_FP32_OR_INT8Z first_argZ_prev_node_input_typeZprev_node_output_typeÚ"is_known_fp32_or_int8_input_moduleZis_known_fp32_input_moduleZis_known_int8_input_moduleÚ prev_nodeZcur_node_dtype_targetrr,rr6&sÜ ÿýÿÿþÿýÿÿÿý ÿýÿþ ÿýr6)rrr!r"csFt||dƒ}t|tƒsdS|d}dd„}|jdkrz|jtjkrN|||ddƒS|jtjtj tj tjfkrv|||dd ƒSdS|jd krBt|jtƒs–t ‚t||jƒ‰tˆtjtjtjtjtjtjtjtjtjtjtjtjtjtjtjtj tj!tj"tj#tj$tj%tjtj&tj'fƒrˆj(ˆj)fSt*‡fdd„|Dƒƒ}|rBt+|||ƒSdS) z{ Returns the qparams (scale, zero_point) of the first input to `node`, if they can be inferred from the graph. rNr#cSslt|||ƒ}t|||ƒ}t|tƒr.t|jtƒs2t‚t|tƒrHt|jtƒsLt‚t||jƒ}t||jƒ}||fSr&)r4r(r r3r7r5r )rrZ scale_arg_idxZ zp_arg_idxZ scale_nodeZzp_nodeZ scale_objZzp_objrrrÚ _get_scale_zp_from_function_args²sz@get_node_input_qparams.._get_scale_zp_from_function_argsr$réér%c3s|]}tˆ|ƒVqdSr&r'r)©Z module_objrrr.ësz)get_node_input_qparams..),r4r(r r2r3r9Zquantize_per_tensorÚtoqÚaddZadd_reluÚmulZmul_relur7r5r ÚnnqZLinearZConv1dZConv2dÚnniqZ ConvReLU2dZConv3dZBatchNorm2dZBatchNorm3dZConvTranspose1dZConvTranspose2dZELUZ GroupNormZInstanceNorm1dZInstanceNorm2dZInstanceNorm3dZ LayerNormZ HardswishZ LeakyReLUZReLU6ZBNReLU2dZBNReLU3dZ ConvReLU1dZ ConvReLU3dZ LinearReLUZscaleZ zero_pointr8Úget_node_input_qparams)rrr!r<r:r=r;rr@rrF¢sb èþÿrF)rrr"cCs¦|jdkr¢t||jƒ}t|ƒr¢t|jƒdks0t‚t|jdtƒsDt‚|jd}t|jt ƒs^t‚t||jƒ}t|ƒr¢t|jƒdks„t‚t|jdtƒs˜t‚|jd}|S)a‡ If node is not an observer, returns it. If node is an observer, navigates up the graph and returns the first parent which is not an observer. For example, graph: (node_non_obs), node = node_non_obs : returns node_non_obs graph: (node_non_obs -> obs0), node = obs0 : returns node_non_obs graph: (node_non_obs -> obs0 -> fq0), node = fq0 : returns node_non_obs r%rr) r2r r3rÚlenÚargsr5r(r r7©rrZnode_objrrrÚreturn_first_non_observer_nodeôs rJcCs*|jdkr&t||jƒ}t|tjƒr&dSdS)aO Assumes that all non-param args occur first. Returns the number of non-param args expected for a node. For example, for F.linear(x, weight, bias) Returns 1, because x is a non-param arg and weight and bias are params. For lstm_mod(x, hid) Returns 2, because both x and hid are non-param args. r%r>r)r2r r3r(ÚnnZLSTMrIrrrÚget_number_of_non_param_argss rL)rr"cCsˆt|jƒdkrgS|jdkr‚|jtjtjjjtjfksP|jtj tjjj tj fkr‚g}t dƒD] }t|j|ƒtkr\| |¡q\|SdgS)a- Returns the indices of args of the node which we should attach loggers to, if input logging is enabled. For example, * for (x + y), returns [0, 1] * for (1 + y), returns [1] * for (x + 1), returns [0] * for (linear(x, w, b)) returns [0] * by default, returns [0] rr$r>)rGrHr2r3r9rBÚopsÚ quantizedÚoperatorrCÚrangeÚtyper Úappend)rÚresultÚirrrÚ get_arg_indices_of_inputs_to_log+s þýrUcCsPd}|jdkrt |j¡}n0|jdkrLt|jtƒs6t‚t||jƒ}t |¡}|S)zˆ Returns a string representation of the type of the function or module pointed to by this node, or '' for other node types. Ú)r$r/r%)r2r9Útypenamer3r(r7r5r )rrr+Z target_modrrrÚget_target_type_strFs rX)ÚresultsÚ model_namer"c Cs€i}| ¡D]n\}}d}| ¡D]>\}}| ¡D],\}} ||kr0t| ƒsLt‚| dd}q0q0q0q |dk rr|||<q|||<q|S)a Rekeys the layer name of a results dictionary to use node names from `model_name`. For example, transforms {'base_op_1_0': {'node_output': {'model_a': [{'ref_node_name': 'linear1', ...}]}}} into {'linear1': {'node_output': {'model_a': [{'ref_node_name': 'linear1', ...}]}}} Note: we cannot use these node names directly because they are not guaranteed to be consistent across models. This is why we extract the results first and rekey afterwards. NrZ ref_node_name)ÚitemsrGr5) rYrZZnew_resultsZold_layer_nameÚresult_type_to_resultsZnew_layer_nameZ_result_typeÚmodel_name_to_resultsZcur_model_nameZlist_of_resultsrrrÚ'rekey_logger_info_on_node_name_of_modelUs r^)rYr"cCsàd}| ¡D]X\}}| ¡D]B\}}| ¡D],\}}t|ƒdkr,|dddk r,|}qZq,q`qqfq|rÜ| ¡D]h\}}| ¡D]V\}}||}| ¡D]<\}}||kr¬qštt|ƒƒD]} || d} | || d<q¸qšq‚qrdS)ay If `fqn` entries are filled in for one of the models in `results`, copies them over to any models which do not have them filled out. A common use case benefitting from this is comparing a model prepared by quantization to a quantized model. In this case, the model prepared by quantization would have `fqn` entries, and the quantized model would not. NrÚfqn)r[rGrP)rYZmodel_name_with_fqnsZ layer_namer\Zresult_typer]rZZ model_resultsZref_model_resultsrTr_rrrÚmaybe_add_missing_fqns|s(r`cs‡‡fdd„‰ˆS)Nc sÐ|^}}}t|tƒrt|tƒs2t|tƒrjt|tƒrjg}t||ƒD]$\}}||f|˜}| ˆ||Ž¡q@|St|tjƒržt|tjƒrž|jr| ¡}|jrž| ¡}|j tj ks¶|j tj krºdS||f|˜}ˆ||ŽSr&)r(ÚtupleÚlistÚziprRr9ÚTensorZis_quantizedr0ZdtypeÚfloat) rHÚkwargsZa0Za1Za_otherrYZel0Zel1Únew_args©ÚfÚinnerrrrjŸs( ÿÿzGmaybe_dequantize_first_two_tensor_args_and_handle_tuples..innerr)rirrhrÚ8maybe_dequantize_first_two_tensor_args_and_handle_tuplesžsrk)ÚxÚyr"cCs*t |¡}t ||¡}dt ||¡S)zµ Computes the SQNR between `x` and `y`. Args: x: Tensor or tuple of tensors y: Tensor or tuple of tensors Return: float or tuple of floats é)r9ZnormÚlog10)rlrmZPsZPnrrrÚcompute_sqnr»s rpcCs"t ||d ¡|d ¡¡S)zÄ Computes the normalized L2 error between `x` and `y`. Args: x: Tensor or tuple of tensors y: Tensor or tuple of tensors Return: float or tuple of floats r>)r9ÚsqrtÚsum©rlrmrrrÚcompute_normalized_l2_errorÌsrtcCs(| dd¡}| dd¡}tjj ||¡S)zÂ Computes the cosine similarity between `x` and `y`. Args: x: Tensor or tuple of tensors y: Tensor or tuple of tensors Return: float or tuple of floats réÿÿÿÿ)Zreshaper9rKZ functionalZcosine_similarityrsrrrÚcompute_cosine_similarityÛsrvcCs4|jdkr0|jtjtjtjtjtjtjfkr0dSdS)Nr$FT)r2r3r9rBrCrOÚcatÚstack)rrrrÚop_type_supports_shadowingîs "ry)rrÚidxr"cCs6z¼|j|dd}|dk rb|\}}t|ƒt|ƒ|ks8t‚|t|ƒkrN||WSt| ¡ƒ|WSnXt|jƒt|jƒ|ks~t‚|t|jƒkr˜|j|WS|t|jƒ}t|j ¡ƒ|WSWnttk r0t|jƒt|jƒ|ksêt‚|t|jƒkr|j|YS|t|jƒ}t|j ¡ƒ|YSYnXdS)zu Given a node, gets the n'th input to that node, normalizing args and kwargs to the best of its ability. T)Znormalize_to_only_use_kwargsN)Znormalized_argumentsrGr5rbÚvaluesrHrfÚRuntimeError)rrrzZnorm_args_and_kwargsZ norm_argsZnorm_kwargsZ kwargs_idxrrrr4õs,ÿ r4)9rrOr9Ztorch.nnrKZtorch.nn.intrinsic.quantizedZ intrinsicrNrEZtorch.ao.nn.quantizedZaorDrMrAÚtypingrrrrrrrZtorch.fxr Ztorch.fx.graphr Ztorch.ao.quantizationrrZtorch.ao.quantization.utilsr Ztorch.ao.quantization.quantizerZns_typesrrÚEnumrr7r6rdreÚintrFrJrLrUrXr^r`rkrprtrvÚboolryr4rrrrÚsb$ û}"üSýýý'"