U
    Mh                     @   s   d dl mZ d dlmZmZmZmZ d dlZd dlZd dl	Z	d dl
mZ eee dddZejjdd	d
Zeeeee f dddZdd Zdd ZdddedddZedd ZedddZedddZedddZdS )     )contextmanager)AnyListTuplecastN)Timer)filenamereturnc              	      s   d}d}d  d}g }t | }| |}t|D ]p\}}|dkrFq4||}	|	dkrZq4|d |	 }
||d   d   fdd|
jd	d
D }|d| q4W 5 Q R X |S )Nz<GRAPH_EXPORT>z</GRAPH_EXPORT> r      c                    s   g | ]}|t  d  qS N)len).0xpfx M/var/www/html/venv/lib/python3.8/site-packages/torch/utils/jit/log_extract.py
<listcomp>   s     zextract_ir.<locals>.<listcomp>T)keepends)openreadsplit	enumeratefind
splitlinesappendjoin)r   ZBEGINENDcurrentZgraphsfZ
split_strsiZ	split_strZend_locslinesr   r   r   
extract_ir	   s$    

r%   )inp_typec                 C   sb   |   }|  }|  }|  }|d k	s,t|d k	s8t|d k	sDt|d k	sPttj||||dS )N)sizestridedevicedtype)sizesstridesr)   r*   AssertionErrortorchZempty_strided)r&   r'   r(   r)   r*   r   r   r   make_tensor_from_type   s    r/   )irr	   c                 C   s
  t jj| dd}|  g }| D ]}t| t jjrN|t	
dd q$t| t jjrt|t	dd q$t| t jjrtt jj| }|t| q$t| t jjr|t	dddk q$td|  q$t jd|}t j|j ||fS )	NT)Zparse_tensor_constantsg?d   r   r   z,A default value is not implemented for type forward)r.   _CZparse_irZmakeMultiOutputIntoTupleinputs
isinstancetypeZ	FloatTyper   randomuniformZIntTyperandint
TensorTyper   r/   ZBoolTypeNotImplementedErrorZ_create_function_from_graphZ!_jit_pass_erase_shape_informationgraph)r0   r<   r4   ZinpZ
tensorTypefuncr   r   r   load_graph_and_inputs*   s"    r>   c                 C   s$   t d| |dd}| }|jd S )Nzfn(*inputs))fnr4   )stmtglobals  )r   Zblocked_autorangeZmedian)r?   r4   	test_runsttimesr   r   r   	time_cuda?   s    rF   c                 C   s6   t  }t|D ]}| |  qt  }|| | d S )NrB   )timeperf_counterrange)r?   r4   rC   r#   _er   r   r   time_cpuD   s
    
rL   
      )warmup_runsrC   )r	   c          	      C   sx   t | \}}t|D ]}||  qd }|D ] }t|tjr*|jjdk} qLq*|d k	sXt|rht|||n
t	|||}|S )Ncpu)
r>   rI   r5   r.   ZTensorr)   r6   r-   rL   rF   )	r0   r4   rO   rC   r<   rJ   Zis_cpuinputoutr   r   r   run_testK   s    
rS   c               	   o   s*   t jd}z
d V  W 5 t j| X d S )NF)r.   r3   Z_get_graph_executor_optimize)argskwargsZold_optimizer   r   r   no_fuserZ   s    
rV   c              
   C   s(   t   t| |W  5 Q R  S Q R X d S r   )rV   rS   r0   r4   r   r   r   run_baseline_no_fusionb   s    rX   c              
   C   sb   zN|rdgndg}t j|}t jd t| |W  5 Q R  W S Q R X W 5 t j| X d S )N)ZDYNAMICrM   )ZSTATICrM   Zfuser1)r.   jitZset_fusion_strategyfuserrS   )r0   r4   ZdynamicZ	old_stratZstratr   r   r   run_nncg   s    $r[   c              
   C   s.   t jd t| |W  5 Q R  S Q R X d S )NZfuser2)r.   rY   rZ   rS   rW   r   r   r   run_nvfuserp   s    r\   )
contextlibr   typingr   r   r   r   r7   r.   rG   Ztorch.utils.benchmarkr   strr%   r3   r:   r/   r>   rF   rL   floatrS   rV   rX   r[   r\   r   r   r   r   <module>   s    
	