o
    h8P                     @   sx  d dl Z d dlZd dlZd dlmZ d dlm  m  m  mZ	 d dl
m  m  mZ ejjZd dlmZmZmZmZmZmZmZ d dlmZ d dlmZ d dlmZmZ d dlmZ d dlm Z  dd	l!m"Z"m#Z# G d
d de j$Z%dedededee&ee" f dee%e%f f
ddZ'dededee&ee" f deeeej(e)f eej(e*f f  fddZ+dededefddZ,dedede*fddZ-dedee* fddZ.dedede&fddZ/de#de&de#fdd Z0de#ddfd!d"Z1d#d$ Z2e2d%ej(d&ej(dej(fd'd(Z3e2d%ej(d&ej(dej(fd)d*Z4e2d%ej(d&ej(dej(fd+d,Z5dede6fd-d.Z7deded/e*defd0d1Z8dS )2    N)TupleCallableDictSetListOptionalUnion)GraphModule)Node)ObserverBaseFakeQuantizeBase)getattr_from_fqn)_is_activation_post_process   )NSNodeTargetTypeNSResultsTypec                   @   s4   e Zd Ze Ze Ze Ze Ze Z	dS )NodeInputOrOutputTypeN)
__name__
__module____qualname__enumautoFP32INT8FP16UNKNOWNFP32_OR_INT8 r   r   J/var/www/html/ai/venv/lib/python3.10/site-packages/torch/ao/ns/fx/utils.pyr      s    r   nodegm
logger_clsnode_type_to_io_type_mapreturnc                    s  |d }|d }|d }|d }|d }|d }	|d }
|d }| j d	krk| j|v r0tjtjfS | j|v r;tjtjfS | j|v rFtjtjfS | j|v ret| |d
}t|tsXJ t	||||\}}||fS tj
tj
fS | j dkr| j dkswJ t| jtsJ t|| j t fdd|
D }t |ttfs|rt| |d
}t|tsJ t	||||\}}||fS t fdd|D }t fdd|	D }|rtjtjfS |rtjtjfS tj
tj
fS | j dkrc| jdkrt| |d
}t|tsJ t	||||\}}|tjfS | jdkr<t| |d
}t|tsJ t	||||\}}t| |d}|tju s7J | d|tjfS | j|v r]t| |d
}t|tsPJ t	||||\}}||fS tj
tj
fS tj
tj
fS )Nfuns_io_type_fp32funs_io_type_fp16funs_io_type_int8funs_io_type_fp32_or_int8mods_io_type_fp32mods_io_type_int8mods_io_type_fp32_or_int8meths_io_type_fp32_or_int8call_functionr   call_modulec                 3       | ]}t  |V  qd S N
isinstance.0target_typemodr   r   	<genexpr>O       

z7get_node_first_input_and_output_type.<locals>.<genexpr>c                 3   r.   r/   r0   r2   r5   r   r   r7   a   r8   c                 3   r.   r/   r0   r2   r5   r   r   r7   d   r8   call_method
dequantizetor   z handling needs to be added)optargetr   r   r   r   get_normalized_nth_inputr1   r
   $get_node_first_input_and_output_typer   strr   anyr   r   torchfloat16)r   r    r!   r"   FUNS_IO_TYPE_FP32FUNS_IO_TYPE_FP16FUNS_IO_TYPE_INT8FUNS_IO_TYPE_FP32_OR_INT8MODS_IO_TYPE_FP32MODS_IO_TYPE_INT8MODS_IO_TYPE_FP32_OR_INT8METHS_IO_TYPE_FP32_OR_INT8	first_arg_prev_node_input_typeprev_node_output_type"is_known_fp32_or_int8_input_moduleis_known_fp32_input_moduleis_known_int8_input_module	prev_nodecur_node_dtype_targetr   r5   r   r?   &   s   







r?   c                    s@  t | |d}t|tsdS |d }dd }|jdkr=|jtjkr'|||ddS |jtjtj	tj
tjfv r;|||dd	S dS |jd
krt|jtsJJ t||j t tjtjtjtjtjtjtjtjtjtjtjtjtjtjtjtjtj tj!tj"tj#tj$tjtj%tj&fr j' j(fS t) fdd|D }|rt*|||S dS )z{
    Returns the qparams (scale, zero_point) of the first input to `node`,
    if they can be inferred from the graph.
    r   Nr*   c                 S   sl   t | ||}t | ||}t|trt|jtsJ t|tr$t|jts&J t||j}t||j}||fS r/   )r>   r1   r
   r=   r@   r   )r   r    scale_arg_idx
zp_arg_idx
scale_nodezp_node	scale_objzp_objr   r   r    _get_scale_zp_from_function_args   s   z@get_node_input_qparams.<locals>._get_scale_zp_from_function_argsr,   r         r-   c                 3   r.   r/   r0   r2   
module_objr   r   r7      r8   z)get_node_input_qparams.<locals>.<genexpr>)+r>   r1   r
   r<   r=   rB   quantize_per_tensortoqaddadd_relumulmul_relur@   r   nnqLinearConv1dConv2dnniq
ConvReLU2dConv3dBatchNorm2dBatchNorm3dConvTranspose1dConvTranspose2dELU	GroupNormInstanceNorm1dInstanceNorm2dInstanceNorm3d	LayerNorm	Hardswish	LeakyReLUReLU6BNReLU2dBNReLU3d
ConvReLU1d
ConvReLU3d
LinearReLUscale
zero_pointrA   get_node_input_qparams)r   r    r"   rR   rJ   rZ   rO   r   r]   r   r      sb   	

	
r   c                 C   s   | j dkrQt|| j}t|rQt| jdksJ t| jd ts"J | jd } t| jts/J t|| j}t|rQt| jdksBJ t| jd tsLJ | jd } | S )a  
    If node is not an observer, returns it.  If node is an observer,
    navigates up the graph and returns the first parent which is not an
    observer.  For example,

    graph: (node_non_obs), node = node_non_obs : returns node_non_obs
    graph: (node_non_obs -> obs0), node = obs0 : returns node_non_obs
    graph: (node_non_obs -> obs0 -> fq0), node = fq0 : returns node_non_obs
    r-   r   r   )	r<   r   r=   r   lenargsr1   r
   r@   r   r    node_objr   r   r   return_first_non_observer_node   s   


r   c                 C   s*   | j dkrt|| j}t|tjrdS dS )aO  
    Assumes that all non-param args occur first. Returns the number of
    non-param args expected for a node.  For example, for

      F.linear(x, weight, bias)

    Returns 1, because x is a non-param arg and weight and bias are params.
    For

      lstm_mod(x, hid)

    Returns 2, because both x and hid are non-param args.
    r-   r[   r   )r<   r   r=   r1   nnLSTMr   r   r   r   get_number_of_non_param_args  s
   
r   c                 C   s   t | jdkr	g S | jdkrA| jtjtjjjtjfv s(| jtj	tjjj	tj	fv rAg }t
dD ]}t| j| tkr>|| q.|S dgS )a-  
    Returns the indices of args of the node which we should attach
    loggers to, if input logging is enabled.

    For example,
    * for (x + y), returns [0, 1]
    * for (1 + y), returns [1]
    * for (x + 1), returns [0]
    * for (linear(x, w, b)) returns [0]
    * by default, returns [0]
    r   r,   r[   )r   r   r<   r=   rB   ra   ops	quantizedoperatorrc   rangetyper
   append)r   resultir   r   r    get_arg_indices_of_inputs_to_log+  s   

r   c                 C   sR   d}| j dv rt| j}|S | j dkr't| jtsJ t|| j}t|}|S )z
    Returns a string representation of the type of the function or module
    pointed to by this node, or '' for other node types.
     )r,   r9   r-   )r<   rB   typenamer=   r1   r@   r   )r   r    r4   
target_modr   r   r   get_target_type_strF  s   


r   results
model_namec           	      C   sz   i }|   D ]4\}}d}| D ]}|  D ]\}}||kr+t|s$J |d d }qqq|dur6|||< q|||< q|S )a	  
    Rekeys the layer name of a results dictionary to use node names
    from `model_name`.

    For example, transforms

        {'base_op_1_0': {'node_output': {'model_a':
          [{'ref_node_name': 'linear1', ...}]}}}

    into

        {'linear1': {'node_output': {'model_a':
          [{'ref_node_name': 'linear1', ...}]}}}

    Note: we cannot use these node names directly because they are not
    guaranteed to be consistent across models. This is why we extract
    the results first and rekey afterwards.
    Nr   ref_node_name)itemsvaluesr   )	r   r   new_resultsold_layer_nameresult_type_to_resultsnew_layer_namemodel_name_to_resultscur_model_namelist_of_resultsr   r   r   'rekey_logger_info_on_node_name_of_modelU  s   

r   c           	      C   s   d}|   D ]$}|  D ]}| D ]\}}t|dkr(|d d dur(|} nq  |rb|   D ]2}|  D ])}|| }| D ]\}}||krJqAtt|D ]}|| d }||| d< qPqAq7q1dS dS )ay  
    If `fqn` entries are filled in for one of the models in `results`, copies
    them over to any models which do not have them filled out.

    A common use case benefitting from this is comparing a model prepared by
    quantization to a quantized model. In this case, the model prepared by
    quantization would have `fqn` entries, and the quantized model would not.
    Nr   fqn)r   r   r   r   )	r   model_name_with_fqnsr   r   r   model_resultsref_model_resultsr   r   r   r   r   maybe_add_missing_fqns|  s4   r   c                    s    fddS )Nc            	         s   | ^}}}t |trt |tst |tr8t |tr8g }t||D ]\}}||g|R }||i | q |S t |tjrRt |tjrR|jrK| }|jrR| }|j	tj
ks^|j	tj
kr`d S ||g|R } |i |S r/   )r1   tuplelistzipr   rB   Tensoris_quantizedr:   dtypefloat)	r   kwargsa0a1a_otherr   el0el1new_argsfinnerr   r   r     s(   
zGmaybe_dequantize_first_two_tensor_args_and_handle_tuples.<locals>.innerr   )r   r   r   r   8maybe_dequantize_first_two_tensor_args_and_handle_tuples  s   r   xyc                 C   s*   t | }t | | }dt ||  S )z
    Computes the SQNR between `x` and `y`.

    Args:
        x: Tensor or tuple of tensors
        y: Tensor or tuple of tensors

    Return:
        float or tuple of floats
       )rB   normlog10)r   r   PsPnr   r   r   compute_sqnr  s   
r   c                 C   s"   t | | d  | d   S )z
    Computes the normalized L2 error between `x` and `y`.

    Args:
        x: Tensor or tuple of tensors
        y: Tensor or tuple of tensors

    Return:
        float or tuple of floats
    r[   )rB   sqrtsumr   r   r   r   r   compute_normalized_l2_error  s   "r   c                 C   s(   |  dd} | dd}tjj| |S )z
    Computes the cosine similarity between `x` and `y`.

    Args:
        x: Tensor or tuple of tensors
        y: Tensor or tuple of tensors

    Return:
        float or tuple of floats
    r   )reshaperB   r   
functionalcosine_similarityr   r   r   r   compute_cosine_similarity  s   r   c                 C   s4   | j dkr| jtjtjtjtjtjtjfv rdS dS )Nr,   FT)r<   r=   rB   ra   rc   r   catstack)r   r   r   r   op_type_supports_shadowing  s   
"r   idxc                 C   s"  z[| j |dd}|dur0|\}}t|t| |ksJ |t|k r'|| W S t| | W S t| jt| j |ks>J |t| jk rK| j| W S |t| j }t| j | W S  ty   t| jt| j |kspJ |t| jk r~| j|  Y S |t| j }t| j |  Y S w )zu
    Given a node, gets the n'th input to that node, normalizing
    args and kwargs to the best of its ability.
    T)normalize_to_only_use_kwargsN)normalized_argumentsr   r   r   r   r   RuntimeError)r   r    r   norm_args_and_kwargs	norm_argsnorm_kwargs
kwargs_idxr   r   r   r>     s,   
r>   )9r   r   rB   torch.nnr   torch.ao.nn.intrinsic.quantizedao	intrinsicr   ri   torch.ao.nn.quantizedre   r   r`   typingr   r   r   r   r   r   r   torch.fxr	   torch.fx.graphr
   torch.ao.quantizationr   r   torch.ao.quantization.utilsr   torch.ao.quantization.observerr   ns_typesr   r   Enumr   r@   r?   r   r   intr   r   r   r   r   r   r   r   r   r   r   boolr   r>   r   r   r   r   <module>   s    $

|"
R


'"