
    Vh                        U d dl Z d dlZd dlZd dlZd dlZd dlZd dlZd dlZd dlZd dl	Z	d dl
Z	d dlZd dlZd dlZd dlZd dlZd dlmZ d dlmZmZmZmZmZ d dlmZ d dlZd dlmZmZmZ d dlmZ d dl m!Z! d dl"m#Z# d d	l$m%Z% d d
l&m'Z' d dl(m)Z)m*Z* d dl+m,Z, d dl-m.Z. d dl/m0Z0 d dl1m2Z2 ddl3m4Z4m5Z5 ddl6m7Z7m8Z8m9Z9m:Z:m;Z; ddl<m=Z=  ej|                  e?      Z@ e%e?d      ZA e%e?d      ZBeCe   ZD e j                  dddg      ZFg dZG ej                  d      deIfd       ZJ	 	 dDdeCe7   deIdeeK   ddfdZLd eCe7   dej                  fd!ZN	 	 dEdeeD   d"eOeKeKf   d#eeK   d$ePddf
d%ZQd"eOeKeKf   deOeKeFf   fd&ZRd'ej>                  jN                  d eDddfd(ZSej                  ded   fd)       ZUi ZVeOeKef   eWd*<   dZXeeP   eWd+<    G d, d-      ZY G d. d/      ZZdeDddfd0Z[deDddfd1Z\ej                   G d2 d3             Z^ ej                         Z`d4ePd5eOeKef   d6eOeKef   deOeKeOeKef   f   fd7Zad8ed9eddfd:Zbd;eKdefd<Zcdd=d>ed?eKf   d@ej                  j                  dAeOeKef   dBee.   deKf
dCZfy)F    N)Iterator)AnyCallableIOOptionalUnion)patch)
draw_graphget_aot_graph_nameget_graph_being_compiled)fx)save_graph_repro)get_debug_dir)getArtifactLogger)GraphModule)_extract_tensor_metadataTensorMetadata)legalize_graph)FileLike)
OrderedSet)tree_map   )configir)BaseSchedulerNodeFusedSchedulerNodeNopKernelSchedulerNode
OutputNodeSchedulerNode)Vir_pre_fusionir_post_fusionBufMetanamen_origin)dotz-Gnslimit=2z-Gnslimit1=2z-Gmaxiter=5000returnc                      	 t        j                  ddgt         j                         y# t         j                  $ r Y yw xY w)Nwhichr&   )stderrTF)
subprocesscheck_outputPIPESubprocessError     E/home/dcms/DCMS/lib/python3.12/site-packages/torch/_inductor/debug.pyhas_dotr2   6   s;    % 0I%% s   '* A A nodesprint_graphfnamec           
         t               st        j                  d       y|
t               }t	        |       }|j
                  D ]  }d|j                  vr|j                  d   j                  }t        |t              rt        |d   t              r|d   f}n|d   }d}t        |t        j                        r|j                  j                  }t        ||ddddd      }||j                  d<    |rt!        |       t#        i |      }t%        |       |j&                  j)                          t+        ||dt,        j.                  j0                         y)z$
    Draw a graph in fname.svg.
    z*draw_buffers() requires `graphviz` packageNfusion_metar   tensor_metaF)
clear_metadot_graph_shape)r2   logwarningr   create_fx_from_snodesr3   metagroup
isinstancetupleintr   ComputedBufferdatadtyper   printr   r   graphlintr
   r   tracer:   )	r3   r4   r5   rG   noder?   rE   metadatagms	            r1   draw_buffersrM   ?   s"    9@A}(*!%(E ,		)		-(..eU#%(C(qa dB--.IIOOE!%dD$M#+		- !,$ e	R	B2HHMMO
EeV\\5Q5Qr0   snodesc                 
   dt         dt        dt        f   fd}t        j                  dg d      }i }i }t
        j                  j                         }d}g }d}| D ]  }	|	j                         rd}
|
}ns|	j                         rd	}
|
}n^t        |	t              rd
}
|
}nIt        |	t              rd}
|	j                  }n*t        |	t              rd}
|	j                  }nt        d      t
        j                   j"                  j%                  |	j'                         d      }|
 d| } ||      }i }t)        |	d      rd|	j+                         i}|j-                  |d|      }dt.        t0        t        f   dt2        ffd |	      r|j5                  |       |	j7                         }||_         |||	|
      |j:                  d<   |||<   |	j=                         D ]  }|||j7                         <    ||} | D ]  }	|	j7                         }|	j>                  j@                  }||   }g }|D ]{  }|j8                  |v r||j8                     }nD|jC                  |      5  |jE                  |j8                        }|||j8                  <   ddd       |k(  rk|j5                  |       } tG        |      |_$         |jK                  tM        |      dk(  r|d          |S tG        |             |S # 1 sw Y   ixY w)B
    Creates a FX Graph from a list of SchedulerNode objects.
    r$   r'   .c                 4    dt         dt        fd}| |_        |S )Nargsr'   c                       yNr   r/   )rR   s    r1   func1z;create_fx_from_snodes.<locals>.get_fake_func.<locals>.func1s   s    r0   )r   rB   __name__)r$   rU   s     r1   get_fake_funcz,create_fx_from_snodes.<locals>.get_fake_funcr   s#    	 	 	 r0   
FusionMeta)r?   snodetypeNexterntemplatenopcomputefusedzUnknown node typeoriginal_atenz: 
get_devicedevicer/   rR   kwargsrY   c                     t        | t              rt        fd| j                  D              S t        d | j	                         D              S )Nc              3   .   K   | ]  } |        y wNr/   ).0x	in_outputs     r1   	<genexpr>z;create_fx_from_snodes.<locals>.in_output.<locals>.<genexpr>   s     >A9Q<>s   c              3   r   K   | ]/  }|j                   D ]  }t        |j                  t                 1 y wrg   )usersr@   rJ   r   )rh   bufusers      r1   rk   z;create_fx_from_snodes.<locals>.in_output.<locals>.<genexpr>   s<      II  499j11s   57)r@   r   anyrN   get_outputs)rY   rj   s    r1   rj   z(create_fx_from_snodes.<locals>.in_output   sF    %!34>>>>  ,,.  r0   r7   r   r   )'strr   rB   collections
namedtupletorchr   Graph	is_externis_templater@   r   r   r?   r   RuntimeError	_inductorutilsget_fused_kernel_name	get_nodeshasattrra   call_functionr   r   boolappendget_namer$   r>   rq   read_writesreadsinserting_beforeplaceholderrA   rR   outputlen)rN   rW   rX   buf_to_fx_nodenode_to_fx_noderG   
first_nodeoutputsr?   rY   	node_type
fused_name	func_name	node_funcrd   fx_noder$   rn   depsnew_argsdepdep_noderj   s                         @r1   r=   r=   m   s   
C HS#X$6  ''6PQJNOHHNNEJGE 2!?? IE "IE56IE}-!IKKE12IKKE233__**@@OO

 !kJ<0	!),	5,' 0 0 23F%%ib%H	U#46H#HI 	d 	 UNN7#~~&0y&I]# '$$& 	5C-4N3<<>*	5  Je2!j  '~~  &&!$' 		&Cxx>))#((3++J7 8$00:H/7N388,8 7"OOH%		& X#'& 
LLs7|q0EL 7<GnEL8 8s   &+K99Lnode_name_to_buf_nameparent_buf_name	n_originsc                 X   | y | D ]  }|j                         }|j                         }| t        |      dkD  rt        ||||n|       Et        |      dk(  r|d   |k(  sJ |j                  }||j
                  x|j
                  D ]  }|j                  }	|	|vs||n|||	<     y )Nr   r   )r   r}   r   $update_orig_fx_node_name_to_buf_namerJ   originsr$   )
r3   r   r   r   rJ   buf_namechildren_nodesir_nodeorigin	node_names
             r1   r   r      s     } ==?)%#n*=*A0%+3
 ~&!+q0AT0III))?goo5oo 	FI  55 / 7H_ &i0	#r0   c                     i }| j                         D ]-  \  }}||vrt        |g      ||<   ||   j                  |       / i }| j                         D ]"  \  }}t        ||         }t	        ||      ||<   $ |S rg   )itemsr   addr   r#   )r   buf_name_to_n_noder   r   node_name_to_buf_metan_nodes         r1   get_node_name_to_buf_metar      s     4::< 8	8--+5yk+Bx(x(,,Y7	8 4::< E	8'12+28V+Di(E ! r0   rL   c                     i }t        ||       |yt        |      }| j                  j                  D ]9  }|j                  |v s|j                  |j                        |j                  d<   ; y)rP   Nbuf_meta)r   r   rG   r3   r$   getr>   )rL   rN   r   r   rJ   s        r1   annotate_orig_fx_with_snodesr     sm     -/(1FG$56KL I99--$9$=$=dii$HDIIj!Ir0   c               #     K   t         j                  j                  dd      dk(  } dd l}t	        j
                  |j                  j                  j                        }t        j                         }| s	 d  |j                          y |j                  t        dd             t         j                  j                  t!               d      }t        j"                  |d       t	        j$                  t         j                  j                  |d	t'                d
            }|j)                  t        j*                         |j-                  t	        j.                  d             |j1                  |       	 d  |j3                  |       |j                          y # |j                          w xY w# |j3                  |       |j                          w xY ww)NTORCH_COMPILE_DEBUG01r   z*functorch.compile.config.debug_partitionerTtorchinductor)exist_okaot_z
_debug.log3[%(filename)s:%(lineno)d %(levelname)s] %(message)s)osenvironr   torch._functorch.aot_autogradlogging	getLogger
_functorchaot_autogradrV   
contextlib	ExitStackcloseenter_contextr	   pathjoinr   makedirsFileHandlerr   setLevelDEBUGsetFormatter	Formatter
addHandlerremoveHandler)compile_debugru   r;   stackr   fhs         r1   enable_aot_loggingr     sZ    JJNN#8#>#EM(


E,,99BB
CC  "E	KKM 
JDQR77<<9DKKt$			
%'(
3	

B KKOOOP NN2"3 KKM0 	"s7   A1G4F 8C>G7F2 ;"GF//G2#GG _inductor_post_to_pre_grad_nodes_pre_grad_graph_idc                   ~   e Zd ZU  ej                         Zi Zeee	e   f   e
d<   ededee   fd       ZddZdeddfdZ	 dd	ed
edededee   f
dZej(                  	 dd	ed
edededeee      f
d       ZdedefdZddZddZd	ededdfdZdeee      dee   dee   ddfdZddZdedee d      fdZ!y)DebugContext._inductor_triton_kernel_to_post_grad_node_infofolder_namer'   c                 6   t         j                  j                  xs
 t               }t        j
                  D ]`  }t        j                  j                  |d|  d|       }t        j                  j                  |      rIt        j                  |       |c S  y )Nr   .)r   rI   	debug_dirr   r   _counterr   r   r   existsr   )r   r   ndirnames       r1   create_debug_dirzDebugContext.create_debug_dirJ  s{    LL**=mo	&& 	Aggll-q$G
 77>>'*G$	 r0   Nc                 R    d | _         d | _        t        j                         | _        y rg   )_prof_pathr   r   _stack)selfs    r1   __init__zDebugContext.__init__X  s     

 **,r0   new_pathc                    | j                   sy |j                  d      sJ |       ddlm} 	  || d      5  t        j
                  j                  |      rt        j                  |       t        j                  | j                   |       d d d        y # 1 sw Y   y xY w# t        $ r$ t        j                  d| j                   |       Y y w xY w)Nz.debugr   )FileLockz.lockz(Failed to copy debug files from %s to %s)r   endswithfilelockr   r   r   r   shutilrmtreecopytreeOSErrorr;   r<   )r   r   r   s      r1   copyzDebugContext.copy]  s    zz  *4H4*%	XJe,- 677>>(+MM(+

H56 6 6  	KK:DJJ	s/   B" ABB" BB" B" "*CCfilename
write_moderR   rd   c                     | j                   sJ t        t        j                  j	                  | j                   |      |g|i |S rg   r   openr   r   r   )r   r   r   rR   rd   s        r1   fopenzDebugContext.fopenm  s:     zzzBGGLLX6
TTTVTTr0   c              /      K   | j                   sJ t        t        j                  j	                  | j                   |      |g|i |5 }| d d d        y # 1 sw Y   y xY wwrg   r   )r   r   r   rR   rd   fs         r1   fopen_contextzDebugContext.fopen_contextw  sW      zzz"'',,tzz84jR4R6R 	VWG	 	 	s   AA#	A	A#A A#suffixc                 r    | j                   sJ t        j                  j                  | j                   |      S rg   )r   r   r   r   )r   r   s     r1   r   zDebugContext.filename  s'    zzzww||DJJ//r0   c                    t         j                  j                  dd l}| j                  sJ t
        j                  j                  | j                  t
        j                  j                  | j                         d      }|j                  |d      5 }|j                  | j                  t
        j                  j                  | j                               d d d        t         j                  j                  |       y y # 1 sw Y   *xY w)Nr   z.tar.gzzw:gz)arcname)r   rI   
upload_tartarfiler   r   r   r   basenamer   r   )r   r   tar_filetars       r1   r   zDebugContext.upload_tar  s    <<"".:::ww||

rww//

;<GDH h/ J3

BGG,<,<TZZ,HIJLL##H- /J Js   ADD
c                    t         j                  rjt        j                  d      j                  }j                  t        j                         dt        dd ffd}| j                  j                  ||       | j                  j                  t        j                  |              t         j                  j                  sy | j                  t!                     | _        t         j                  j$                  r | j'                  dt        j                         t         j                  j(                  r!| j'                  dt        j*                         y y )Nztorch._dynamolevelr'   c                 (    j                  |        y rg   )r   )r   r;   s    r1   reset_log_levelz/DebugContext.__enter__.<locals>.reset_log_level  s    U#r0   z	debug.logzinfo.log)r   debugr   r   r   r   r   r   r   callbackr   r    set_debug_handlerrI   enabledr   r   r   	debug_log_setup_log_captureinfo_logINFO)r   
prev_levelr   r;   s      @r1   	__enter__zDebugContext.__enter__  s    <<##O4CJLL'$s $t $ KK  *=!!!"5"5d";<||##**+=+?@
<<!!##K?<<  ##J= !r0   r   c                    t        j                  d      }| j                  j                  | j	                  |            }t        j
                  |      }|j                  |       |j                  t        j                  d             |j                  |       |j                  t        |j                  |             | j                  j                  |j                  |       y )Nztorch._inductorr   )r   r   r   r   r   StreamHandlerr   r   r   r   minr   r  r   )r   r   r   r;   fdchs         r1   r  zDebugContext._setup_log_capture  s    
  12[[&&tzz(';<""2&
E
ST	
 	rSE*+S..3r0   exc_typeexc_valexc_tbc                 .   | j                   r*| j                   j                          | j                          | j                  r9| j	                          t
        j                  dt               | j                         | j                  j                          y )Nz%s debug trace: %s)
r   disable_save_profile_datar   r   r;   r<   r   r   r   )r   r  r  r  s       r1   __exit__zDebugContext.__exit__  sa     ::JJ ##%::OOKK,.F.H$**Ur0   c                    | j                   sJ | j                   j                  | j                  d             | j                  d      5 }t	        j
                  | j                   |      }|j                          |j                  d       |j                  d       |j                  d       |j                  d       d d d        y # 1 sw Y   y xY w)Nzcompile.profzcompile.stats)streamcumtimed   tottime)	r   
dump_statsr   r   pstatsStats
strip_dirs
sort_statsprint_stats)r   r  statss      r1   r  zDebugContext._save_profile_data  s    zzz

dmmN;<ZZ( 	#BLLB7EY'c"Y'c"	# 	# 	#s   
A6C		Cr$   ).Nc                 
   t         j                  j                  r0t        t         j                  |      r	 t        t	        |       |      S dt        dt        dd fd}|S # t
        $ r t        j                  dd       Y y w xY w)Nz Ignoring exception in debug codeT)exc_inforR   rd   r'   c                       y rg   r/   rc   s     r1   ignoredz)DebugContext.__getattr__.<locals>.ignored  s    r0   )	r   rI   r  getattrDebugFormatter	Exceptionr;   r<   r   )r   r$   r&  s      r1   __getattr__zDebugContext.__getattr__  sy    <<GFLL$$?~d3T::s c d  N  >Ns   A  BB)r'   N)w)"rV   
__module____qualname__	itertoolscountr   r   dictrr   list__annotations__staticmethodr   r   r   r   r   r   r   r   contextmanagerr   r   r   r   r
  rB   r  rZ   BaseExceptionr  r  r   r*  r/   r0   r1   r   r   D  s   y H LN2Dd3i4HMc hsm  -
S T & UU U 	U
 U 
CU  		 	 		
 	 
"S'		 	0s 0s 0
.>.44 4 
	4 4./ -( 	
 
	# )1D(E r0   r   c                      e Zd ZdeddfdZdej                  j                  deej                     ddfdZ
dej                  j                  deej                     ddfdZd	eddfd
Zd	eddfdZed	edefd       Zd	eddfdZdej                  j                  d	eddfdZdeddfdZ	 ddedeeeee   f   eeef   f   fdZdedeej4                     dedef   dededdfdZy)r(  handlerr'   Nc                 x    |j                   | _         |j                  | _        |j                  | _        || _        y rg   )r   r   r   r7  )r   r7  s     r1   r   zDebugFormatter.__init__  s/    ]]
$22((r0   rL   inputsc           
         | j                  d      5 }d }t        j                  j                  j                  j
                  rRt        j                  j                  j                  |      }t        j                  j                  |j                        }t        j                  j                  j                  j
                  }t        j                  j                  j                  ddd      5  t        |||d||       d d d        d d d        | j                  d      5 }|j                  |j!                  d             d d d        y # 1 sw Y   MxY w# 1 sw Y   QxY w# 1 sw Y   y xY w)Nzfx_graph_runnable.pyF)ztrace.enabledztrace.save_real_tensorsinductor)save_dirstable_hashzfx_graph_readable.pyprint_output)r   ru   rz   r   rI   save_real_tensors_subclasses
fake_utilstry_convert_fake_to_realr   r   r   r$   r	   r   writeprint_readable)r   rL   r9  r  r<  r=  s         r1   fx_graphzDebugFormatter.fx_graph  s+   
 ZZ./ 	2H%%++==**55NNvV77??2773
  //0066HHK''--"'EJ 
 !% +
	, ZZ./ 	<2HHR&&E&:;	< 	<
 
	 	,	< 	<s0   CE/EE""E%E	EE"%E.c                     | j                  d      5 }|j                  |j                  d             d d d        y # 1 sw Y   y xY w)Nzfx_graph_transformed.pyFr>  )r   rD  rE  )r   rL   r9  r  s       r1   fx_graph_transformedz#DebugFormatter.fx_graph_transformed  sB    
 ZZ12 	<bHHR&&E&:;	< 	< 	<s	   "=Ar3   c                     | j                  d      5 }|j                  | j                  |             d d d        y # 1 sw Y   y xY w)Nzir_pre_fusion.txtr   rD  	_write_irr   r3   r  s      r1   r!   zDebugFormatter.ir_pre_fusion  s;    ZZ+, 	,HHT^^E*+	, 	, 	,	   !<Ac                     | j                  d      5 }|j                  | j                  |             d d d        y # 1 sw Y   y xY w)Nzir_post_fusion.txtrJ  rL  s      r1   r"   zDebugFormatter.ir_post_fusion  s;    ZZ,- 	,HHT^^E*+	, 	, 	,rM  c                     t        j                         }| D ]2  }|j                  |j                                |j                  d       4 |j	                         S )Nz


)ioStringIOrD  	debug_strgetvalue)r3   rn   rJ   s      r1   rK  zDebugFormatter._write_ir  sI    kkm 	 DIIdnn&'IIh	  ||~r0   c                 <    t        || j                  d             y )Nzgraph_diagram.svg)r5   )rM   r   )r   r3   s     r1   graph_diagramzDebugFormatter.graph_diagram   s    U$--0C"DEr0   c                     t        ||       t        || j                  d      dt        dt        j
                  j                         y )Nzorig_fx_graph_diagram.svgFT)r5   r9   progparse_stack_tracer:   )r   r
   r   GRAPHVIZ_COMMAND_SCALABLEr   rI   r:   )r   rL   r3   s      r1   draw_orig_fx_graphz!DebugFormatter.draw_orig_fx_graph#  s<    
 	%R/-- ;<*""LL88	
r0   r   c                 N    t        j                  || j                  d             y )Nzoutput_code.py)r   r   r   )r   r   s     r1   output_codezDebugFormatter.output_code2  s    Hdmm,<=>r0   c                    i }| j                  |d      5 }t        j                  d|j                         t        j
                  }t        j                  ||       d d d        i }t        rJ| j                  dd      5 }t        t        t        |      }t        j                  ||       d d d        ||fS ||fS # 1 sw Y   _xY w# 1 sw Y   ||fS xY w)Nr+  z/Writing provenance tracing debugging info to %sz/inductor_provenance_tracking_node_mappings.json)r   r;   infor$   r   r   jsondumpr   create_node_mappingr   )r   r   
debug_infor  node_mappings        r1   1log_inductor_triton_kernel_to_post_grad_node_infoz@DebugFormatter.log_inductor_triton_kernel_to_post_grad_node_info5  s     
ZZ#& 	&"HHFP%TTJIIj"%	& A3 ,2&(H*  		,+, <''z<''	& 	&, <''s   AB:>,C:CCr$   input_nodestimingsChoiceCallerelapseprecompile_elapsec           	      L   ddl m dt         j                  dt        t        t        f   ffd|t
        j                  j                         t
        j                  j                         |D cg c]
  } |       c}||d}| j                  ddd	
      5 }|j                         D ][  \  }	}
t        |	j                               }|j                  |       |
|d<   t        j                  ||       |j                  d       ] 	 d d d        y c c}w # 1 sw Y   y xY w)Nr   )FixedLayoutrJ   r'   c           	          t        | d      r| j                  }nd}|t        |       j                  d}	 | j	                         }t        |      rd}	 t        |j                        } |j                  |j                  g t        j                  j                  j                  |j                         g t        j                  j                  j                  |j"                        |      }t%        |      |d<   nt%        |      |d<   	 t%        | j'                               |d<   	 t%        | j)                               |d	<   	 t%        t        j                  j                  j                  | j+                                     |d
<   	 t%        t        j                  j                  j                  | j-                                     |d<   	 t%        t        j                  j                  j                  | j/                                     |d<   t        | d      r9t        | j0                  t2        j4                        r | j0                        |d<   |S # t        $ rJ 	 t        j                  j                  j                  |j                  d      }n# t        $ r Y nw xY wY Cw xY w# t        $ r Y w xY w# t        $ r Y w xY w# t        $ r Y w xY w# t        $ r Y aw xY w# t        $ r Y -w xY w# t        $ r Y w xY w)Nr$    )r$   rZ   r   )fallback)rE   sizestrideoffsetlayoutrE   rb   rp  ro  numelrD   )r~   r$   rZ   rV   get_output_specr@   rB   rq  r)  r    rG   sizevars	size_hintrb   rE   
size_hintsro  rp  rr   	get_dtypera   
get_strideget_size	get_numelrD   r   IRNode)rJ   r   	node_inforr  rq  static_layoutrk  build_node_infos         r1   r  z>DebugFormatter.log_autotuning_results.<locals>.build_node_infoR  s   tV$ II		!T
++I--/fk2F!!$V]]!3 %0$llHqww//::6;;GHL!1!1!<!<V]]!KL%%M +.m*<Ih'*-f+Ih'%()9%:	'"&)$//*;&<	(#&)GG$$//0AB'	(#
$'(8(8(C(CDMMO(T$U	&!%()9)9)C)CDNNDT)U%V	'" tV$DIIryy)I$3DII$>	&!W % !!%&WW%5%5%?%? & &@ &F  ) ! !!"            s   J1 I *B$J1 K ,K 	AK! AK1 AL 	J.%5JJ.	J'$J.&J''J.*J1 -J..J1 1	J>=J>	KK	KK!	K.-K.1	K>=K>	LL)op_namecuda_device_namecuda_device_countre  autotuning_timeprecompile_timezautotuning_result_json_list.txtatzutf-8)encodingbenchmark_result
)r   rk  r|  r0  rr   ru   cudaget_device_namedevice_countr   r   	info_dictupdater_  r`  rD  )r   r$   re  rf  rh  ri  rJ   general_propertiesr  callertimer  rk  r  s               @@r1   log_autotuning_resultsz%DebugFormatter.log_autotuning_resultsH  s    	$:	")) :	S#X :	z  %

 : : <!&!8!8!:>IJdOD1J%0
 -tg   
 	 '  !1!1!34	  !3404	,-		)R(	 		 K	 	s   2D
A/DD#)z.inductor_triton_kernel_to_post_grad_nodes.json)rV   r,  r-  r   r   ru   r   r   r1  TensorrF  rH  SchedulerNodeListr!   r"   r3  rr   rK  rU  rZ  r\  rA   r0  r   rd  r   r|  floatr  r/   r0   r1   r(  r(    s     <HH  < U\\"< 
	<<<HH  < U\\"< 
	<,#4 , ,,$5 ,$ , * s  F#4 F F
HH  
 !
 
	
?C ?D ? O((	tCcN#T#s(^3	4(&VV "))_V ne+,	V
 V !V 
Vr0   r(  c                     t         j                  t        j                        r)t         j	                  dt
        j                  |              t        j                  j                  |        y )NzBEFORE FUSION
%s)
ir_pre_fusion_logisEnabledForr   r  r^  r(  rK  r    r  r!   r3   s    r1   log_ir_pre_fusionr    sB    %%gll32N4L4LU4STGG% r0   c                     t         j                  t        j                        r)t         j	                  dt
        j                  |              t        j                  j                  |        y )NzAFTER FUSION
%s)
ir_post_fusion_logr  r   r  r^  r(  rK  r    r  r"   r  s    r1   log_ir_post_fusionr    sB    &&w||4 2N4L4LU4STGG5!r0   c                   6    e Zd ZU eed<   ej                  ed<   y)TensorMetadataHoldertensor_metadatarb   N)rV   r,  r-  r   r2  ru   rb   r/   r0   r1   r  r    s    ##LLr0   r  pre_grad_graph_idpost_to_pre_grad_nodes_jsontriton_kernel_to_post_grad_jsonc           	         i i i i d}t         j                  d       t        |t              st         j	                  d       |S t        |t              st         j	                  d       |S t        | t
              st         j	                  d       |S t        j                  t              }t        j                  t              }t        j                  t              }	 |j                         D ]I  \  }}t        |t              st         j	                  d       |c S |D ]  }	||	   j                  |        K dt        t        t        f   dt        fd	}
|j                         D ]<  \  }}t        |t              st         j	                  d
       |c S |D ]  } |
|      s|c c S |j                  d      | k(  r.||d      j                  |       ||   j                  |d          |j                  dg       D cg c]  }||f }}|sx|j!                         \  } |
|      s|c c S |j                  d      | k(  r.||d      j                         |   j                  |d          |j#                  fd|j                  dg       D               |r
 ? dt        t        t        f   ddfd} ||        ||        ||       ||||dS c c}w # t$        $ r}t         j	                  d|       t         j	                  d|       t         j	                  d|       t         j	                  d|        t         j	                  t'        j(                                |cY d}~S d}~ww xY w)zCreate bidirectional mappings between:

    - pre_grad graph nodes and post_grad graph code nodes, and vice versa
    - triton kernel name and post_grad graph code nodes, and vice versa
    )	preToPost	postToPrecppCodeToPostpostToCppCodez.Creating node mappings for provenance trackingzCProvenance tacking error: post_to_pre_grad_nodes_json is not a dictzGProvenance tacking error: triton_kernel_to_post_grad_json is not a dictz9Provenance tacking error: pre_grad_graph_id is not an intzMProvenance tacking error: triton_kernel_to_post_grad_json value is not a listrJ   r'   c                     t        | t              st        j                  d       yd| vsd| vsd| vrt        j                  d       yy)NzVProvenance tacking error: node provenance in post_to_pre_grad_nodes_json is not a dictFgraph_idr$   	from_nodezYProvenance tacking error: node provenance in post_to_pre_grad_nodes_json has wrong formatT)r@   r0  r;   error)rJ   s    r1   check_formatz)create_node_mapping.<locals>.check_format  sN    dD)		l %t);{RV?V		o r0   zIProvenance tacking error: post_to_pre_grad_nodes_json value is not a listr  r$   r  c              3   &   K   | ]  }|f 
 y wrg   r/   )rh   r   
parent_keys     r1   rk   z&create_node_mapping.<locals>.<genexpr>  s      !,-J!s   dNc                 J    | D ]  }t        | |         | |<    t        |       } y rg   )r1  r0  )r  keys     r1   convert_sets_to_listsz2create_node_mapping.<locals>.convert_sets_to_lists  s+     &af#&QAr0   z+Unexpected error in create_node_mapping: %sz post_to_pre_grad_nodes_json:  %sz$triton_kernel_to_post_grad_json:  %szpre_grad_graph_id:  %s)r;   r^  r@   r0  r  rB   rs   defaultdictr   r   r1  r   rr   r   r   r   popextendr)  	traceback
format_exc)r  r  r  empty_returnpre_to_postpost_to_prepost_to_cpp_code	outer_key
node_array	curr_noder  rJ   r   r   current_noder  er  s                    @r1   ra  ra    sM    	/L HH=>148		WX5t<		U	
 '-		MN"-"9"9*"EK"-"9"9*"EK'2'>'>z'JK%D%J%J%L 	;!Izj$/		c $#' ;	 +//	:;	;	tCH~ 	$ 	 &A%F%F%H 	!Izj$/		_ $#" #D)''88J'+<<V-11)<	*..tF|< 26+r1JKA!YKK/4yy{,L*'5++#''
37HH#L$89==jI#J/33L4HILL !1=1A1A+r1R!  	6	T#s(^ 	 	 	k*k*./$$<-	
 	
+ L6  
 			?C		46QR		24S	
 			*,=>		)&&()
sX   >K% A9K% K% ,AK% K K%  K% 3A.K% "=K%  K% %	M9.B M4.M94M9rR   rd   c                     d}t         j                  j                  |      st        j                  |       dt        dt        fd}t        || |f      \  }}d}| d| dt        t               d}t        |d	      5 }t        j                  ||f|       d
d
d
       t        j                  t        j                        rd| d|d}	t        |	       y
y
# 1 sw Y   BxY w)z
    This function is used to save arguments for a compile_fx_inner function call
    to the file system.  Later on one can replay the compile_fx_inner call
    with the saved arguments using load_args_and_run_compile_fx_inner.
    z/tmp/inductor_saved_argsri   r'   c                 x    t        | t        j                        rt        t	        |       | j
                        S | S )z
        Pickle FakeTensor will result in error:
        AttributeError: Can't pickle local object 'WeakValueDictionary.__init__.<locals>.remove'

        Convert all Tensor to metadata. This may also makes pickle faster.
        )r@   ru   r  r  r   rb   ri   s    r1   handle_tensorz5save_args_for_compile_fx_inner.<locals>.handle_tensor9  s.     a&'(@(CQXXNNHr0   compile_fx_inner/_z.pklwbNz3
Arguments for a compile_fx_inner call is saved to z. To replay the call,
run the following:

from torch._inductor.debug import load_args_and_run_compile_fx_inner
load_args_and_run_compile_fx_inner(z
)
        )r   r   r   mkdirr   r   nextsave_args_cntr   pickler`  r;   r  r   r   rF   )
rR   rd   folderr  args_to_savekwargs_to_savefn_namer   r   messages
             r1   save_args_for_compile_fx_innerr  .  s     (F77>>&!

 
 
 $,MD&>#J L. GXQwiqm!4 5T:D	dD	 7Q\>2A67 &337& 9$ %)8 ,	 	g '7 7s   >CC!r   c                    ddl m} t        | d      5 }t        j                  |      \  }}d d d        dt
        dt
        fd}t        j                  j                  d      }|5  t        j                  d	d
      5  t        |f      \  }} ||i |cd d d        cd d d        S # 1 sw Y   ~xY w# 1 sw Y   nxY wd d d        y # 1 sw Y   y xY w)Nr   )r  rbri   r'   c                 
   t        | t              rrt        j                  j                  j                  | j                  j                  | j                  j                  | j                  j                  | j                        S | S rg   )r@   r  ru   _dynamotestingrand_stridedr  shaperp  rE   rb   r  s    r1   r  z9load_args_and_run_compile_fx_inner.<locals>.handle_tensorb  se    a-.==((55!!''!!((!!''	  Hr0   T)allow_non_fake_inputs	save_argsF)torch._inductor.compile_fxr  r   r  loadr   ru   rA  FakeTensorModer   r	   r   )r   r  r   rR   rd   r  	fake_modes          r1   "load_args_and_run_compile_fx_innerr  \  s    ;	dD	 &Q{{1~f&	 	 	 !!00t0LI	 1FLLe4 1f~>f001 1 1& &1 1 1 1 1s/   B)&C
=B5	C
)B25B>	:C

C)package_pathfunc.exported_programinductor_configsr  c                   ddl m} ddlm} ddlm} ddlm} |j                  j                  }|j                         }	t        |	t        j                  j                        sJ |j                  \  }
}	 |r$|j                  j                   dk(  r ||d|       |r|j                  j                   d	k(  rt#        j$                  |	      }t#        j$                  |j                        }t#        j$                  |      } |||d   |d
   |      \  }}t'        |      }t        j(                  j)                  ||d      } | |j                         |||dd        | |	|
||||      S # |$ r(} ||dd|       t*        j-                  d       |d }~wt.        $ r2}|r)d}|j                  j                   d
k(  rd} ||d||       |d }~ww xY w)Nr   )AccuracyError)dump_to_minify)r   )_aoti_flatten_inputs   aot_inductor)options   r   F)strictTaccuracy)r  r  load_and_runcheck_accuracy)r  r  r  aot_inductor_accuracyminify)commandr  zAccuracy failedrun)torch._dynamo.debug_utilsr  torch._dynamo.repro.aotir  torch._inductorr   r  r  r  dump_aoti_minifiermoduler@   ru   r   r   example_inputsrepro_levelr   deepcopyrA   exportr;   r<   r)  )r  r  r  r  r  r  r   r  use_minifierrL   rR   rd   gm_copyexample_inputs_copyconfig_copyflat_example_inputstuple_inputsflattened_epr  r  s                       r1   aot_inductor_minifier_wrapperr  s  s    87&?&&99L		 	 	"Bb%((..///#22LD&>F//;;q@ (
 F//;;q@ mmB'G"&--0@0O0O"P--(89K/C#A&#A&#	0, !!45L <<..wU.SL##%!,)!) -%%
 	
  #$		
 	%& G""..!3 (	 s%   5C5E+ +G0#FG-GG)FNrT   )grs   r   r   dataclasses	functoolsrP  r.  r_  r   r   os.pathr  r  r   r+   r  collections.abcr   typingr   r   r   r   r   unittest.mockr	   ru   functorch.compiler
   r   r   r   torch._dynamo.repro.after_aotr   torch._dynamo.utilsr   torch._loggingr   torch.fx.graph_moduler   torch.fx.passes.shape_propr   r   torch.fx.passes.tools_commonr   torch.typesr   torch.utils._ordered_setr   torch.utils._pytreer   rm  r   r   	schedulerr   r   r   r   r   virtualizedr    r   rV   r;   r  r  r1  r  rt   r#   rY  	lru_cacher   r2   rr   rM   rv   r=   r0  rB   r   r   r   r4  r   r   r2  r   r   r(  r  r  	dataclassr  r/  r  ra  r  r  r  ExportedProgramr  r/   r0   r1   <module>r     s        	    	       $ 5 5   V V  : - , - O 7   / (    g!%h@ &x1AB I 
 +
 
 VZ,@
AT  T   +!"++ C=+ 
	+\_$'8"9 _bhh _J &*	 %& S>  c]  	 
 
 F!S>!	#w,!"III 
I" %HTN % %V 46  $sCx. 5$( HSM (\ \~{ {|!. !4 !"/ "D "   
  	!ss!%c3hs &*#s(^s 
#tCH~
	sl+# + + +\1S 1S 18 (,Q
38
Qll22Q 38n	Q
 8$Q 	Qr0   