o
    g]                     @   sb   d dl mZ d dlZd dlmZ d dlmZ d dl	m
Z
 ddlmZmZ dd ZG dd	 d	ZdS )
    )PathN)
ModelProto   )attribute_to_kwargfind_by_namec              	   C   s  t  }|dd | jD  |dd | jD  g }| jD ]w}|}dd |jD }|ri }|jD ]M}i }	|jtjjkrOt	|j
|\}
}|j|
i}	|| n*|jtjjkrug }|jD ]}t	||\}
}||
 || q[|j|i}	nt|}	||	 q1tj|j|j|jfd|ji|}|| q| d | j| |dd | jD  g }| jD ]}|j|v r||j q|| qd	d
 | jD }|D ]0}| j| |j|v rz| j||j  W q ty   |jdk rtd|j d Y qw q|dd | jD  | |fS )zClean unused initializers from graph.

    Returns:
        A cleaned graph without unused initializers
        A list of tensor names, which are not produced by this graph and its subgraphes
    c                 s   s$    | ]}|j D ]}|r|V  qqd S N)input).0node
input_name r   Z/var/www/visachat/venv/lib/python3.10/site-packages/onnxruntime/quantization/onnx_model.py	<genexpr>   s   " z-_clean_initializers_helper.<locals>.<genexpr>c                 s   s    | ]	}|j r|j V  qd S r   name)r	   g_outr   r   r   r      s    c                 S   s,   g | ]}|j tjjks|j tjjkr|qS r   )typeonnxAttributeProtoGRAPHGRAPHSr	   attrr   r   r   
<listcomp>   s
    z._clean_initializers_helper.<locals>.<listcomp>r   r
   c                 s   s     | ]}|j D ]}|V  qqd S r   )output)r	   r
   r   r   r   r   r   @   s    c                 S   s   i | ]}|j |qS r   r   r	   r   r   r   r   
<dictcomp>J   s    z._clean_initializers_helper.<locals>.<dictcomp>   zWarning: invalid weight name z' found in the graph (not a graph input)c                 s   s    | ]}|j V  qd S r   r   r   r   r   r   r   T   s    )setupdater
   r   	attributer   r   r   r   _clean_initializers_helpergr   r   graphsappendr   onnx_helper	make_nodeop_typer   
ClearFieldextenddifference_updateinitializerremoveStopIteration
ir_versionprint)graphmodelrequesting_tensor_names	new_nodesr
   new_nodegraph_attrskwargsr   new_attributecleaned_sub_graphsub_requesting_tensor_namescleaned_graphessubgraphunused_initializerr+   name_to_inputr   r   r   r!      sp   





"




r!   c                   @   s  e Zd ZdefddZdd Zdd Zdd	 Zd
d Zdd Z	dd Z
dd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zd d! Zd"efd#d$Zd%d& Zd'd( Zd)d* Zd+d, Zd-d. Zd/d0 Zd1d2 Zdfd4d5Zdfd6d7Zdfd8d9Zd:d; Z d<d= Z!d>d? Z"d@dA Z#e$dBdC Z%e$dDdE Z&dFdG Z'dgdIdJZ(e$dKdL Z)dMdN Z*dOdP Z+e$dQdR Z,dSdT Z-dUdV Z.dWdX Z/dYdZ Z0d"ed[e1fd\d]Z2d^d_ Z3d`da Z4dfdbdcZ5ddde Z6d3S )h	ONNXModelr1   c                 C   s
   || _ d S r   )r1   )selfr1   r   r   r   __init__Z      
zONNXModel.__init__c                 C   
   | j jjS r   )r1   r0   r
   r?   r   r   r   nodes]   rA   zONNXModel.nodesc                 C   rB   r   r1   r0   r+   rC   r   r   r   r+   `   rA   zONNXModel.initializerc                 C   sV   t |dkr
td|  D ]}| |d q|D ]}| | | jjj| qd S )Nr   zCan add an empty list.gain)len
ValueErrorr+   _check_initr1   r0   r$   )r?   initsinitr   r   r   initializer_extendc   s   
zONNXModel.initializer_extendc                 C      | j jS r   )r1   r0   rC   r   r   r   r0   l      zONNXModel.graphc                 C   rM   r   )r1   r.   rC   r   r   r   r.   o   rN   zONNXModel.ir_versionc                 C   rM   r   )r1   opset_importrC   r   r   r   rO   r   rN   zONNXModel.opset_importc                 C   s@   | j jD ]}|j|kr||_ d S q| j jt||g d S r   )r1   rO   domainversionr)   r%   make_opsetid)r?   rP   rQ   opsetr   r   r   set_opset_importu   s   
zONNXModel.set_opset_importc                 C   s&   || j jjv r| j jj| d S d S r   )r1   r0   r
   r,   r?   r
   r   r   r   remove_node}   s   zONNXModel.remove_nodec                 C      |D ]}|  | qd S r   )rV   )r?   nodes_to_remover
   r   r   r   remove_nodes      zONNXModel.remove_nodesc                 C   s   | j jj| |g d S r   )r1   r0   r
   r)   _check_noderU   r   r   r   add_node      zONNXModel.add_nodec                 C   rW   r   )r\   )r?   nodes_to_addr
   r   r   r   	add_nodes   rZ   zONNXModel.add_nodesc                 C   s:   t |j| jjjd u r| | | jjj|g d S d S r   )r   r   r1   r0   r+   rI   r)   )r?   tensorr   r   r   add_initializer   s   
zONNXModel.add_initializerc                 C   &   | j jjD ]}|j|kr|  S qd S r   )r1   r0   r+   r   )r?   r   r`   r   r   r   get_initializer   
   
zONNXModel.get_initializerc                 C   rb   r   )r1   r0   r   r   )r?   r   r   r   r   r   find_graph_input   rd   zONNXModel.find_graph_inputc                 C   rb   r   )r1   r0   r   r   )r?   output_namer   r   r   r   find_graph_output   rd   zONNXModel.find_graph_outputtensor_namec                 C   sV   dd | j jjD }||v r|| jS | |}|r|jjS | |}|r)|jjS d S )Nc                 S   s   i | ]}|j |jqS r   )r   r   )r	   objr   r   r   r      s    z-ONNXModel.get_tensor_type.<locals>.<dictcomp>)r1   r0   
value_infotensor_typere   r   rg   )r?   rh   tensor_type_mapg_inputg_outputr   r   r   get_tensor_type   s   


zONNXModel.get_tensor_typec                 C   sr   | j jjD ]#}|jdkr(|jd |kr(|jD ]}|jdkr't|j	    S qq| 
|}|d ur7t|S d S )NConstantr   value)r1   r0   r
   r'   r   r    r   onnx_numpy_helperto_arraytrc   )r?   rf   r
   r   r+   r   r   r   get_constant_value   s   




zONNXModel.get_constant_valuec                 C   s   dd | j jjD S )Nc                 S   s   h | ]}|j qS r   r   )r	   r+   r   r   r   	<setcomp>       z5ONNXModel.get_initializer_name_set.<locals>.<setcomp>rE   rC   r   r   r   get_initializer_name_set   s   z"ONNXModel.get_initializer_name_setc                 C   sX   || j jjv r(| j jj| | j jjD ]}|j|jkr'| j jj|  d S qd S d S r   )r1   r0   r+   r,   r   r   )r?   r`   r   r   r   r   remove_initializer   s   zONNXModel.remove_initializerc                 C   rW   r   )ry   )r?   init_to_remover+   r   r   r   remove_initializers   rZ   zONNXModel.remove_initializersc                 C   s8   |   }t }| jjjD ]}|j|vr||j q|S r   )rx   r   r1   r0   r   r   add)r?   initializer_namesnon_initializer_inputsr   r   r   r   get_non_initializer_inputs   s   
z$ONNXModel.get_non_initializer_inputsc                 C   sJ   i }| j jjD ]}|jD ]}|r!||vr|g||< q|| | qq|S r   )r1   r0   r
   r   r$   )r?   input_name_to_nodesr
   r   r   r   r   r      s   
zONNXModel.input_name_to_nodesc                 C   s0   i }| j jjD ]}|jD ]}|r|||< qq|S r   )r1   r0   r
   r   )r?   output_name_to_noder
   rf   r   r   r   r      s   
zONNXModel.output_name_to_nodeNc                 C   sD   |d u r|   }g }|jD ]}||v r|| D ]}|| qq|S r   )r   r   r$   )r?   r
   r   childrenr   r   r   r   get_children   s   
zONNXModel.get_childrenc                 C   s:   |d u r|   }g }|jD ]}||v r|||  q|S r   )r   r   r$   )r?   r
   r   parentsr   r   r   r   get_parents   s   
zONNXModel.get_parentsc                 C   s@   |d u r|   }t|j|krd S |j| }||vrd S || S r   )r   rG   r   )r?   r
   idxr   r   r   r   r   
get_parent  s   
zONNXModel.get_parentc                 C   s"   t |j}|| t||}|S )zFind out if a node exists in a graph or a node is in the
        new set of nodes created during quantization.

        Returns:
            The node found or None.
        )listr
   r)   r   )r?   	node_namenew_nodes_listr0   graph_nodes_listr
   r   r   r   find_node_by_name  s   


zONNXModel.find_node_by_namec              	   C   sb   d}| j jjD ]'}|jr.|j|r.zt|jt|d }t||}W q ty-   Y qw q|S )z
        Gets the largest node name (int) suffix for all node names that begin with `node_name_prefix`.
        Example: for nodes my_prefix_0 and my_prefix_3, this method returns 3.
        N)	r1   r0   r
   r   
startswithintrG   maxrH   )r?   node_name_prefixsuffixr
   indexr   r   r   get_largest_node_name_suffix  s   z&ONNXModel.get_largest_node_name_suffixc              	   C   s\   d}| j jjD ]$}|j|r+zt|jt|d }t||}W q ty*   Y qw q|S )ab  
        Gets the largest initializer name integer suffix for all initializer names that begin
        with `initializer_name_prefix`. This can be used to create unique initializer names.

        Example: for initializer names 'my_weight_0' and 'my_weight_3', this method returns 3 if
                 `initializer_name_prefix` is 'my_weight_'.
        r   N)	r1   r0   r+   r   r   r   rG   r   rH   )r?   initializer_name_prefixr   r+   r   r   r   r   #get_largest_initializer_name_suffix+  s   z-ONNXModel.get_largest_initializer_name_suffixc                 C   s4   g }|j D ]}|jD ]}||jkr|| q
q|S )zD
        Find all nodes with given initializer as an input.
        )r
   r   r   r$   )r?   r0   r+   rD   r
   
node_inputr   r   r   find_nodes_by_initializer?  s   



z#ONNXModel.find_nodes_by_initializerc                 C   sL   t t|d ddD ]}|| }|jD ]}|j| kr"||f    S qq
dS )Nr   r   )NN)rangerG   r+   r   )r   
graph_pathgidr0   r`   r   r   r   __get_initializerJ  s   

zONNXModel.__get_initializerc                 C   s2  g }| d }|j D ]}}dd |jD }t|roi }|jD ]@}|jdkr3| |j |jt| i}n%|jdkrTg }|j	D ]}	| |	 |
t| g q=|j|i}nt|}|| qtj|j|j|jfd|ji|}|jdkrd}
d}d	}d	}|jD ]-}|jd
krt|}
q|jdkrt|}q|jdkrt|}q|jdkrt|}q|
dkr||dkr||d	kr||jd }|dkr%t|jd | \}}|rt|}t|j}|j|_|j| |jD ]}|j|kr|j|  nq|j
|g n |d7 }tjd|jd g|g|jr|jd ndd}|| tjd|jd	 |g|jd	 t|jdkr<dnd g|jrH|jd ndd}|| t|jdkr{tjd|jd	 d |jd g|j|jrr|jd ndd}|| q	|| q	|| q	|d |j 
| |   |S )Nr   c                 S   s$   g | ]}|j d ks|j dkr|qS )   
   )r   r   r   r   r   r   X  s   $ z8ONNXModel.__replace_gemm_with_matmul.<locals>.<listcomp>r   r   r   Gemmg      ?r   alphabetatransAtransBr   _Transposed	Transpose
_Transpose )inputsoutputsr   MatMul   _MatMulAdd_Addr
   )r
   r    rG   r   r$   r"   r   r>   $_ONNXModel__replace_gemm_with_matmulr#   r)   r   r   r%   r&   r'   r   r   get_attribute_value_ONNXModel__get_initializerrr   rs   
from_arrayTr+   r,   r(   pop)r   r3   r0   r
   r5   r6   r   kvrq   r;   r   r   r   r   inputBBBs_graphB_arrayB_transr   transpose_nodematmul_noder\   r   r   r   __replace_gemm_with_matmulS  s   

















"


z$ONNXModel.__replace_gemm_with_matmulc                 C   s   |   g}t| d S r   )r0   r>   r   )r?   r   r   r   r   replace_gemm_with_matmul  s   
z"ONNXModel.replace_gemm_with_matmulFc                 C   sZ   |    |rtjj| jdt|jd dd | jjjD ]}| 	|d qt
| j| dS )zS
        Save model to external data, which is needed for model size > 2GB
        Tz.data)all_tensors_to_one_filelocationconvert_attributeendN)topological_sortr   external_data_helperconvert_model_to_external_datar1   r   r   r0   r+   rI   
save_model)r?   output_pathuse_external_data_formatrK   r   r   r   save_model_to_file  s   zONNXModel.save_model_to_filec                 C   H   t |tr
t |tsJ tt| jD ]}| j| |kr!|| j|< qd S r   )
isinstancestrr   rG   r   )r
   old_input_namenew_input_namejr   r   r   replace_node_input     
zONNXModel.replace_node_inputc                 C   "   | j jjD ]	}t||| qd S r   )r1   r0   r
   r>   r   )r?   r   r   r
   r   r   r   replace_input_of_all_nodes     z$ONNXModel.replace_input_of_all_nodesc                 C   ,   | j jjD ]}|j|v rt||| qd S r   )r1   r0   r
   r   r>   r   )r?   r   r   node_names_setr
   r   r   r   replace_input_of_nodes  
   
z ONNXModel.replace_input_of_nodesc                 C   r   r   )r   r   r   rG   r   )r
   old_output_namenew_output_namer   r   r   r   replace_node_output  r   zONNXModel.replace_node_outputc                 C   r   r   )r1   r0   r
   r>   r   )r?   r   r   r
   r   r   r   replace_output_of_all_nodes  r   z%ONNXModel.replace_output_of_all_nodesc                 C   r   r   )r1   r0   r
   r   r>   r   )r?   r   r   r   r
   r   r   r   replace_output_of_nodes  r   z!ONNXModel.replace_output_of_nodesc                 C   s   |   }g }|  }|D ]}|jdkr'| |jd s'|jd |vr'|| q| | g }|  D ](}|j|vr[| |js[|| | 	 j
D ]}|j|jkrZ| 	 j
| qJq3| | d S )Nrp   r   )r   rD   r'   is_graph_outputr   r$   rY   r+   r   r0   r   r,   r{   )r?   r   unused_nodesrD   r
   ununsed_weightswgraph_inputr   r   r   remove_unused_constant  s(   



z ONNXModel.remove_unused_constantc                       t  fdd| jjjD S )Nc                 3       | ]}|j  kV  qd S r   r   )r	   r   rf   r   r   r         z,ONNXModel.is_graph_output.<locals>.<genexpr>)anyr1   r0   r   )r?   rf   r   r   r   r      r]   zONNXModel.is_graph_outputreturnc                    r   )Nc                 3   r   r   r   r   rh   r   r   r     r   z+ONNXModel.is_graph_input.<locals>.<genexpr>)r   r1   r0   r   )r?   rh   r   r   r   is_graph_input  r]   zONNXModel.is_graph_inputc                 C   s  dgt |   }i }g }t|  D ]:\}}tdd |jD ||< || dkr3||  |  q|jD ]}|s;q6||vrE|g||< q6|| | q6qdd |  D }dd | jjjD }|| }	|		  d }
|	D ]+}|
|krtqm|}
||v r|| D ]}|| d ||< || dkr||  |  q~qmd}t |}||k r|| j
D ](}||v r|| D ]}|| d ||< || dkr||  |  |d }qq|d }||k s|t |  jksJ d|  d	 |  j| d S )
Nr   c                 s   s    | ]}|rd V  qdS )r   Nr   )r	   _r   r   r   r     s    z-ONNXModel.topological_sort.<locals>.<genexpr>c                 S      g | ]}|j qS r   r   )r	   rK   r   r   r   r     rw   z.ONNXModel.topological_sort.<locals>.<listcomp>c                 S   r   r   r   r   r   r   r   r     rw   r   zGraph is not a DAGr
   )rG   rD   	enumeratesumr   r$   r+   r1   r0   sortr   r
   r(   r)   )r?   
deps_countdeps_to_nodessorted_nodesnode_idxr
   r   r}   graph_input_namesinput_namesprev_input_namestartr   r   r   r   r   r     s\   

zONNXModel.topological_sortc                 C   s   t |  | jS r   )r!   r0   r1   rC   r   r   r   clean_initializers<  s   zONNXModel.clean_initializersc                 C   sJ   |j tjjkr#|dr#t|j}ttdd |r#t	d|j
d|S )Nraw_datac                 S   s   | d@ dkS )N   r   )ir   r   r   <lambda>C  s    z'ONNXModel._check_init.<locals>.<lambda>zInitializer z	 has nan.)	data_typer   TensorProtoFLOAT8E4M3FNHasFieldr   r   r   maprH   r   )r?   rK   testbr   r   r   rI   ?  s   

zONNXModel._check_initc                 C   sX   |j dkr*|jd }| |}|j}|tjjtjjtjjtjj	hv r*t
d| d|S )z
        A quantization to float 8 does not use quantized bias but float 16 bias.
        This function checks that DequantizeLinear is not used to
        dequantize from float 16.
        DequantizeLinearr   z;Unsupported DequantizeLinear operator, dequantization from .)r'   r   rc   r   r   r   FLOAT16FLOATDOUBLEBFLOAT16RuntimeError)r?   r
   
zero_pointrK   dtyper   r   r   r[   G  s   


zONNXModel._check_noder   )F)7__name__
__module____qualname__r   r@   rD   r+   rL   r0   r.   rO   rT   rV   rY   r\   r_   ra   rc   re   rg   r   ro   ru   rx   ry   r{   r   r   r   r   r   r   r   r   r   r   staticmethodr   r   r   r   r   r   r   r   r   r   r   r   boolr   r   r   rI   r[   r   r   r   r   r>   Y   sj    	





]


4
r>   )pathlibr   r   onnx.helperhelperr%   onnx.numpy_helpernumpy_helperrr   onnx.onnx_pbr   quant_utilsr   r   r!   r>   r   r   r   r   <module>   s   J