o
    3Ih}]                     @   sb   d dl mZ d dlZd dlmZ d dlmZ d dl	m
Z
 ddlmZmZ dd ZG dd	 d	ZdS )
    )PathN)
ModelProto   )attribute_to_kwargfind_by_namec              	   C   s  t  }|dd | jD  |dd | jD  g }| jD ]w}|}dd |jD }|ri }|jD ]M}i }	|jtjjkrOt	|j
|\}
}|j|
i}	|| n*|jtjjkrug }|jD ]}t	||\}
}||
 || q[|j|i}	nt|}	||	 q1tj|j|j|jfd|ji|}|| q| d | j| |dd | jD  g }| jD ]}|j|v r||j q|| qd	d
 | jD }|D ]0}| j| |j|v rz| j||j  W q ty   |jdk rtd|j d Y qw q|dd | jD  | |fS )zClean unused initializers from graph.

    Returns:
        A cleaned graph without unused initializers
        A list of tensor names, which are not produced by this graph and its subgraphes
    c                 s   s$    | ]}|j D ]}|r|V  qqd S N)input).0node
input_name r   c/home/air/sanwanet/gpt-api/venv/lib/python3.10/site-packages/onnxruntime/quantization/onnx_model.py	<genexpr>   s   " z-_clean_initializers_helper.<locals>.<genexpr>c                 s   s    | ]	}|j r|j V  qd S r   name)r	   g_outr   r   r   r          c                 S   s,   g | ]}|j tjjks|j tjjkr|qS r   )typeonnxAttributeProtoGRAPHGRAPHSr	   attrr   r   r   
<listcomp>   s
    z._clean_initializers_helper.<locals>.<listcomp>r   r
   c                 s   s     | ]}|j D ]}|V  qqd S r   )output)r	   r
   r   r   r   r   r   @   s    c                 S   s   i | ]}|j |qS r   r   r	   r   r   r   r   
<dictcomp>J   s    z._clean_initializers_helper.<locals>.<dictcomp>   zWarning: invalid weight name z' found in the graph (not a graph input)c                 s   s    | ]}|j V  qd S r   r   r   r   r   r   r   T   s    )setupdater
   r   	attributer   r   r   r   _clean_initializers_helpergr   r   graphsappendr   onnx_helper	make_nodeop_typer   
ClearFieldextenddifference_updateinitializerremoveStopIteration
ir_versionprint)graphmodelrequesting_tensor_names	new_nodesr
   new_nodegraph_attrskwargsr   new_attributecleaned_sub_graphsub_requesting_tensor_namescleaned_graphessubgraphunused_initializerr,   name_to_inputr   r   r   r"      sp   





"




r"   c                   @   s  e Zd ZdefddZdd Zdd Zdd	 Zd
d Zdd Z	dd Z
dd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zd d! Zd"efd#d$Zd%d& Zd'd( Zd)d* Zd+d, Zd-d. Zd/d0 Zd1d2 Zdfd4d5Zdfd6d7Zdfd8d9Zd:d; Z d<d= Z!d>d? Z"d@dA Z#e$dBdC Z%e$dDdE Z&dFdG Z'dgdIdJZ(e$dKdL Z)dMdN Z*dOdP Z+e$dQdR Z,dSdT Z-dUdV Z.dWdX Z/dYdZ Z0d"ed[e1fd\d]Z2d^d_ Z3d`da Z4dfdbdcZ5ddde Z6d3S )h	ONNXModelr2   c                 C   s
   || _ d S r   )r2   )selfr2   r   r   r   __init__Z      
zONNXModel.__init__c                 C   
   | j jjS r   )r2   r1   r
   r@   r   r   r   nodes]   rB   zONNXModel.nodesc                 C   rC   r   r2   r1   r,   rD   r   r   r   r,   `   rB   zONNXModel.initializerc                 C   sV   t |dkr
td|  D ]}| |d q|D ]}| | | jjj| qd S )Nr   zCan add an empty list.gain)len
ValueErrorr,   _check_initr2   r1   r%   )r@   initsinitr   r   r   initializer_extendc   s   
zONNXModel.initializer_extendc                 C      | j jS r   )r2   r1   rD   r   r   r   r1   l      zONNXModel.graphc                 C   rN   r   )r2   r/   rD   r   r   r   r/   o   rO   zONNXModel.ir_versionc                 C   rN   r   )r2   opset_importrD   r   r   r   rP   r   rO   zONNXModel.opset_importc                 C   s@   | j jD ]}|j|kr||_ d S q| j jt||g d S r   )r2   rP   domainversionr*   r&   make_opsetid)r@   rQ   rR   opsetr   r   r   set_opset_importu   s   
zONNXModel.set_opset_importc                 C   s&   || j jjv r| j jj| d S d S r   )r2   r1   r
   r-   r@   r
   r   r   r   remove_node}   s   zONNXModel.remove_nodec                 C      |D ]}|  | qd S r   )rW   )r@   nodes_to_remover
   r   r   r   remove_nodes      zONNXModel.remove_nodesc                 C   s   | j jj| |g d S r   )r2   r1   r
   r*   _check_noderV   r   r   r   add_node      zONNXModel.add_nodec                 C   rX   r   )r]   )r@   nodes_to_addr
   r   r   r   	add_nodes   r[   zONNXModel.add_nodesc                 C   s:   t |j| jjjd u r| | | jjj|g d S d S r   )r   r   r2   r1   r,   rJ   r*   )r@   tensorr   r   r   add_initializer   s   
zONNXModel.add_initializerc                 C   &   | j jjD ]}|j|kr|  S qd S r   )r2   r1   r,   r   )r@   r   ra   r   r   r   get_initializer   
   
zONNXModel.get_initializerc                 C   rc   r   )r2   r1   r   r   )r@   r   r   r   r   r   find_graph_input   re   zONNXModel.find_graph_inputc                 C   rc   r   )r2   r1   r   r   )r@   output_namer   r   r   r   find_graph_output   re   zONNXModel.find_graph_outputtensor_namec                 C   sV   dd | j jjD }||v r|| jS | |}|r|jjS | |}|r)|jjS d S )Nc                 S   s   i | ]}|j |jqS r   )r   r   )r	   objr   r   r   r      s    z-ONNXModel.get_tensor_type.<locals>.<dictcomp>)r2   r1   
value_infotensor_typerf   r   rh   )r@   ri   tensor_type_mapg_inputg_outputr   r   r   get_tensor_type   s   


zONNXModel.get_tensor_typec                 C   sr   | j jjD ]#}|jdkr(|jd |kr(|jD ]}|jdkr't|j	    S qq| 
|}|d ur7t|S d S )NConstantr   value)r2   r1   r
   r(   r   r!   r   onnx_numpy_helperto_arraytrd   )r@   rg   r
   r   r,   r   r   r   get_constant_value   s   




zONNXModel.get_constant_valuec                 C   s   dd | j jjD S )Nc                 S   s   h | ]}|j qS r   r   )r	   r,   r   r   r   	<setcomp>       z5ONNXModel.get_initializer_name_set.<locals>.<setcomp>rF   rD   r   r   r   get_initializer_name_set   s   z"ONNXModel.get_initializer_name_setc                 C   sX   || j jjv r(| j jj| | j jjD ]}|j|jkr'| j jj|  d S qd S d S r   )r2   r1   r,   r-   r   r   )r@   ra   r   r   r   r   remove_initializer   s   zONNXModel.remove_initializerc                 C   rX   r   )rz   )r@   init_to_remover,   r   r   r   remove_initializers   r[   zONNXModel.remove_initializersc                 C   s8   |   }t }| jjjD ]}|j|vr||j q|S r   )ry   r   r2   r1   r   r   add)r@   initializer_namesnon_initializer_inputsr   r   r   r   get_non_initializer_inputs   s   
z$ONNXModel.get_non_initializer_inputsc                 C   sJ   i }| j jjD ]}|jD ]}|r!||vr|g||< q|| | qq|S r   )r2   r1   r
   r   r%   )r@   input_name_to_nodesr
   r   r   r   r   r      s   
zONNXModel.input_name_to_nodesc                 C   s0   i }| j jjD ]}|jD ]}|r|||< qq|S r   )r2   r1   r
   r   )r@   output_name_to_noder
   rg   r   r   r   r      s   
zONNXModel.output_name_to_nodeNc                 C   sD   |d u r|   }g }|jD ]}||v r|| D ]}|| qq|S r   )r   r   r%   )r@   r
   r   childrenr   r   r   r   get_children   s   
zONNXModel.get_childrenc                 C   s:   |d u r|   }g }|jD ]}||v r|||  q|S r   )r   r   r%   )r@   r
   r   parentsr   r   r   r   get_parents   s   
zONNXModel.get_parentsc                 C   s@   |d u r|   }t|j|krd S |j| }||vrd S || S r   )r   rH   r   )r@   r
   idxr   r   r   r   r   
get_parent  s   
zONNXModel.get_parentc                 C   s"   t |j}|| t||}|S )zFind out if a node exists in a graph or a node is in the
        new set of nodes created during quantization.

        Returns:
            The node found or None.
        )listr
   r*   r   )r@   	node_namenew_nodes_listr1   graph_nodes_listr
   r   r   r   find_node_by_name  s   


zONNXModel.find_node_by_namec              	   C   sb   d}| j jjD ]'}|jr.|j|r.zt|jt|d }t||}W q ty-   Y qw q|S )z
        Gets the largest node name (int) suffix for all node names that begin with `node_name_prefix`.
        Example: for nodes my_prefix_0 and my_prefix_3, this method returns 3.
        N)	r2   r1   r
   r   
startswithintrH   maxrI   )r@   node_name_prefixsuffixr
   indexr   r   r   get_largest_node_name_suffix  s   z&ONNXModel.get_largest_node_name_suffixc              	   C   s\   d}| j jjD ]$}|j|r+zt|jt|d }t||}W q ty*   Y qw q|S )ab  
        Gets the largest initializer name integer suffix for all initializer names that begin
        with `initializer_name_prefix`. This can be used to create unique initializer names.

        Example: for initializer names 'my_weight_0' and 'my_weight_3', this method returns 3 if
                 `initializer_name_prefix` is 'my_weight_'.
        r   N)	r2   r1   r,   r   r   r   rH   r   rI   )r@   initializer_name_prefixr   r,   r   r   r   r   #get_largest_initializer_name_suffix+  s   z-ONNXModel.get_largest_initializer_name_suffixc                 C   s4   g }|j D ]}|jD ]}||jkr|| q
q|S )zD
        Find all nodes with given initializer as an input.
        )r
   r   r   r%   )r@   r1   r,   rE   r
   
node_inputr   r   r   find_nodes_by_initializer?  s   



z#ONNXModel.find_nodes_by_initializerc                 C   sL   t t|d ddD ]}|| }|jD ]}|j| kr"||f    S qq
dS )Nr   r   )NN)rangerH   r,   r   )r   
graph_pathgidr1   ra   r   r   r   __get_initializerJ  s   

zONNXModel.__get_initializerc                 C   s2  g }| d }|j D ]}}dd |jD }t|roi }|jD ]@}|jdkr3| |j |jt| i}n%|jdkrTg }|j	D ]}	| |	 |
t| g q=|j|i}nt|}|| qtj|j|j|jfd|ji|}|jdkrd}
d}d	}d	}|jD ]-}|jd
krt|}
q|jdkrt|}q|jdkrt|}q|jdkrt|}q|
dkr||dkr||d	kr||jd }|dkr%t|jd | \}}|rt|}t|j}|j|_|j| |jD ]}|j|kr|j|  nq|j
|g n |d7 }tjd|jd g|g|jr|jd ndd}|| tjd|jd	 |g|jd	 t|jdkr<dnd g|jrH|jd ndd}|| t|jdkr{tjd|jd	 d |jd g|j|jrr|jd ndd}|| q	|| q	|| q	|d |j 
| |   |S )Nr   c                 S   s$   g | ]}|j d ks|j dkr|qS )   
   )r   r   r   r   r   r   X  s   $ z8ONNXModel.__replace_gemm_with_matmul.<locals>.<listcomp>r   r   r   Gemmg      ?r   alphabetatransAtransBr   _Transposed	Transpose
_Transpose )inputsoutputsr   MatMul   _MatMulAdd_Addr
   )r
   r!   rH   r   r%   r#   r   r?   $_ONNXModel__replace_gemm_with_matmulr$   r*   r   r    r&   r'   r(   r   r   get_attribute_value_ONNXModel__get_initializerrs   rt   
from_arrayTr,   r-   r)   pop)r   r4   r1   r
   r6   r7   r   kvrr   r<   r   r   r   r   inputBBBs_graphB_arrayB_transr   transpose_nodematmul_noder]   r   r   r   __replace_gemm_with_matmulS  s   

















"


z$ONNXModel.__replace_gemm_with_matmulc                 C   s   |   g}t| d S r   )r1   r?   r   )r@   r   r   r   r   replace_gemm_with_matmul  s   
z"ONNXModel.replace_gemm_with_matmulFc                 C   sZ   |    |rtjj| jdt|jd dd | jjjD ]}| 	|d qt
| j| dS )zS
        Save model to external data, which is needed for model size > 2GB
        Tz.data)all_tensors_to_one_filelocationconvert_attributeendN)topological_sortr   external_data_helperconvert_model_to_external_datar2   r   r   r1   r,   rJ   
save_model)r@   output_pathuse_external_data_formatrL   r   r   r   save_model_to_file  s   zONNXModel.save_model_to_filec                 C   H   t |tr
t |tsJ tt| jD ]}| j| |kr!|| j|< qd S r   )
isinstancestrr   rH   r   )r
   old_input_namenew_input_namejr   r   r   replace_node_input     
zONNXModel.replace_node_inputc                 C   "   | j jjD ]	}t||| qd S r   )r2   r1   r
   r?   r   )r@   r   r   r
   r   r   r   replace_input_of_all_nodes     z$ONNXModel.replace_input_of_all_nodesc                 C   ,   | j jjD ]}|j|v rt||| qd S r   )r2   r1   r
   r   r?   r   )r@   r   r   node_names_setr
   r   r   r   replace_input_of_nodes  
   
z ONNXModel.replace_input_of_nodesc                 C   r   r   )r   r   r   rH   r   )r
   old_output_namenew_output_namer   r   r   r   replace_node_output  r   zONNXModel.replace_node_outputc                 C   r   r   )r2   r1   r
   r?   r   )r@   r   r   r
   r   r   r   replace_output_of_all_nodes  r   z%ONNXModel.replace_output_of_all_nodesc                 C   r   r   )r2   r1   r
   r   r?   r   )r@   r   r   r   r
   r   r   r   replace_output_of_nodes  r   z!ONNXModel.replace_output_of_nodesc                 C   s   |   }g }|  }|D ]}|jdkr'| |jd s'|jd |vr'|| q| | g }|  D ](}|j|vr[| |js[|| | 	 j
D ]}|j|jkrZ| 	 j
| qJq3| | d S )Nrq   r   )r   rE   r(   is_graph_outputr   r%   rZ   r,   r   r1   r   r-   r|   )r@   r   unused_nodesrE   r
   ununsed_weightswgraph_inputr   r   r   remove_unused_constant  s(   



z ONNXModel.remove_unused_constantc                       t  fdd| jjjD S )Nc                 3       | ]}|j  kV  qd S r   r   )r	   r   rg   r   r   r         z,ONNXModel.is_graph_output.<locals>.<genexpr>)anyr2   r1   r   )r@   rg   r   r   r   r      r^   zONNXModel.is_graph_outputreturnc                    r   )Nc                 3   r   r   r   r   ri   r   r   r     r   z+ONNXModel.is_graph_input.<locals>.<genexpr>)r   r2   r1   r   )r@   ri   r   r   r   is_graph_input  r^   zONNXModel.is_graph_inputc                 C   s  dgt |   }i }g }t|  D ]:\}}tdd |jD ||< || dkr3||  |  q|jD ]}|s;q6||vrE|g||< q6|| | q6qdd |  D }dd | jjjD }|| }	|		  d }
|	D ]+}|
|krtqm|}
||v r|| D ]}|| d ||< || dkr||  |  q~qmd}t |}||k r|| j
D ](}||v r|| D ]}|| d ||< || dkr||  |  |d }qq|d }||k s|t |  jksJ d|  d	 |  j| d S )
Nr   c                 s   s    | ]}|rd V  qdS )r   Nr   )r	   _r   r   r   r     s    z-ONNXModel.topological_sort.<locals>.<genexpr>c                 S      g | ]}|j qS r   r   )r	   rL   r   r   r   r     rx   z.ONNXModel.topological_sort.<locals>.<listcomp>c                 S   r   r   r   r   r   r   r   r     rx   r   zGraph is not a DAGr
   )rH   rE   	enumeratesumr   r%   r,   r2   r1   sortr   r
   r)   r*   )r@   
deps_countdeps_to_nodessorted_nodesnode_idxr
   r   r~   graph_input_namesinput_namesprev_input_namestartr   r   r   r   r   r     s\   

zONNXModel.topological_sortc                 C   s   t |  | jS r   )r"   r1   r2   rD   r   r   r   clean_initializers<  s   zONNXModel.clean_initializersc                 C   sJ   |j tjjkr#|dr#t|j}tdd |D r#td|j	d|S )Nraw_datac                 s   s    | ]	}|d @ d kV  qdS )   Nr   )r	   ir   r   r   r   C  r   z(ONNXModel._check_init.<locals>.<genexpr>zInitializer z	 has nan.)
	data_typer   TensorProtoFLOAT8E4M3FNHasFieldr   r   r   rI   r   )r@   rL   testbr   r   r   rJ   ?  s   

zONNXModel._check_initc                 C   sX   |j dkr*|jd }| |}|j}|tjjtjjtjjtjj	hv r*t
d| d|S )z
        A quantization to float 8 does not use quantized bias but float 16 bias.
        This function checks that DequantizeLinear is not used to
        dequantize from float 16.
        DequantizeLinearr   z;Unsupported DequantizeLinear operator, dequantization from .)r(   r   rd   r   r   r   FLOAT16FLOATDOUBLEBFLOAT16RuntimeError)r@   r
   
zero_pointrL   dtyper   r   r   r\   G  s   


zONNXModel._check_noder   )F)7__name__
__module____qualname__r   rA   rE   r,   rM   r1   r/   rP   rU   rW   rZ   r]   r`   rb   rd   rf   rh   r   rp   rv   ry   rz   r|   r   r   r   r   r   r   r   r   r   r   staticmethodr   r   r   r   r   r   r   r   r   r   r   r   boolr   r   r   rJ   r\   r   r   r   r   r?   Y   sj    	





]


4
r?   )pathlibr   r   onnx.helperhelperr&   onnx.numpy_helpernumpy_helperrs   onnx.onnx_pbr   quant_utilsr   r   r"   r?   r   r   r   r   <module>   s   J