
    Vh              !          U d Z ddlZddlZddlZddlZddlZddlZddlmZ ddl	m
Z
 ddl	mZ ddlmZ ddlmZ dd	lmZmZ dd
lmZ ddlZddlZ G d de      Z G d d      Zeeef   ZdZi Zeed<   	 dddZg dZ G d de       Z!d Z" G d d      Z# G d d      Z$dedefdZ%dedede&fd Z'd! Z(	 	 	 	 	 d]d"ed#ed$eded%e&d&e&dee   fd'Z)d(ed)ed*ed+ed,eee*f   d-e&d&e&d.e$d/e&ddfd0Z+d1 Z,d2 Z- ej\                  d3      Z/d4 Z0d5 Z1d6 Z2d7 Z3 ej\                  d8      Z4d9 Z5 ej\                  d:      Z6d; Z7 ej\                  d<      Z8d= Z9d^d>Z:d? Z;d@ Z<dA Z=dB Z>dC Z? G dD dE      Z@ G dF dG      ZA eA       ZBi ZC eA       ZDi ZEeeeFf   edH<   i ZGe
D ]  ZH eIeHe      sJ eHj                         D ]  \  ZKZLeLd   ZMeLdd ZNej                  eNvr<eDj                  eK       ej                  eNv reEj                  eKdI      reMeGeK<   neMeEeK<   ej                  eNvsiej                  eNvsxeBj                  eK       eMeCeK<      ej\                  eBj                               ZU ej\                  dJeDj                          dK      ZV ej\                  dL      ZW ej\                  dM      ZX ej\                  dN      ZY ej\                  dO      ZZ	 d(ed)ed*ed+ed,eee*f   d-e&d&e&d.e$d/e&defdPZ[d^dQZ\dR Z]dS Z^ ej\                  dT      Z_dU Z`dV Za	 	 	 	 	 	 	 	 	 	 	 	 	 	 d_dWedXe&dedYed(ed+ed#edZed%e&d$ed/e&d-e&d&e&d[e&d.ee$   def d\Zby)`a   The Python Hipify script.
##
# Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
#               2017-2018 Advanced Micro Devices, Inc. and
#                         Facebook Inc. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
# THE SOFTWARE.
    N   )	constants)CUDA_TO_HIP_MAPPINGS)MATH_TRANSPILATIONS)Optional)Iterator)MappingIterable)Enumc                       e Zd ZdZdZy)CurrentStater      N)__name__
__module____qualname__INITIALIZEDDONE     P/home/dcms/DCMS/lib/python3.12/site-packages/torch/utils/hipify/hipify_python.pyr   r   -   s    KDr   r   c                       e Zd Zd Zd Zy)HipifyResultc                 .    || _         || _        d| _        y )N current_statehipified_pathstatus)selfr   r   s      r   __init__zHipifyResult.__init__2   s    **r   c                 T    d| j                    d| j                   d| j                   S )NzHipifyResult:: current_state: z, hipified_path : z
, status: r   r   s    r   __str__zHipifyResult.__str__7   sF    01C1C0DDVW[WiWiVjjtuy  vA  vA  uB  C  	Dr   N)r   r   r   r    r#   r   r   r   r   r   1   s    
Dr   r   z;// !!! This is a file automatically generated by hipify!!!
HIPIFY_FINAL_RESULTscalar_t)DtypeT)!
InputErroropenfbcolorsGeneratedFileCleanermatch_extensionsmatched_files_iterpreprocess_file_and_save_resultcompute_statsadd_dim3processKernelLaunchesfind_closure_groupfind_bracket_groupfind_parentheses_groupreplace_math_functionship_header_magicreplace_extern_sharedget_hip_file_pathis_out_of_placeis_pytorch_fileis_cusparse_fileis_special_fileis_caffe2_gpu_filer=   Triepreprocessorfile_specific_replacementfile_add_headerfix_static_global_kernelsextract_argumentsstr2boolr   r   hipifyc                   $     e Zd Z fdZd Z xZS )r(   c                 2    t         |   |       || _        y N)superr    message)r   rJ   	__class__s     r   r    zInputError.__init__N   s    !r   c                      d| j                    S )NzInput error: )rJ   r"   s    r   r#   zInputError.__str__R   s    t||n--r   )r   r   r   r    r#   __classcell__)rK   s   @r   r(   r(   K   s    .r   r(   c                     t        | |d      S )Nignore)errors)open)filenamemodes     r   r)   r)   V   s    $x00r   c                   ,    e Zd ZdZdZdZdZdZdZdZ	dZ
y	)
r*   z[95mz[94mz[92mz[93mz[91mz[0mz[1mz[4mN)r   r   r   HEADEROKBLUEOKGREENWARNINGFAILENDCBOLD	UNDERLINEr   r   r   r*   r*   [   s*    FFGGDDDIr   r*   c                   2    e Zd ZdZddZd Zd ZddZd Zy)	r+   z+Context Manager to clean up generated filesc                 >    || _         t               | _        g | _        y rH   )keep_intermediatessetfiles_to_cleandirs_to_clean)r   r_   s     r   r    zGeneratedFileCleaner.__init__p   s    "4!er   c                     | S rH   r   r"   s    r   	__enter__zGeneratedFileCleaner.__enter__u   s    r   c                     t         j                  j                  |      s8| j                  j	                  t         j                  j                  |             t        |g|i |S rH   )ospathexistsra   addabspathrQ   )r   fnargskwargss       r   rQ   zGeneratedFileCleaner.openx   sH    ww~~b!##BGGOOB$78B((((r   c                    t         j                  j                  |      \  }}|s"t         j                  j                  |      \  }}|r4|r2t         j                  j                  |      s| j	                  |d       t         j                  j                  |      r|sNt        j                  |       | j                  j                  t         j                  j                  |             y y )NT)exist_ok)
rf   rg   splitrh   makedirsisdirmkdirrb   appendrj   )r   dnro   parentns        r   rq   zGeneratedFileCleaner.makedirs}   s    GGMM"%	f-IFAav 6MM&4M0ww}}R HHRL%%bggoob&9: )1r   c                     | j                   sS| j                  D ]  }t        j                  |        | j                  d d d   D ]  }t        j
                  |        y y )N)r_   ra   rf   unlinkrb   rmdir)r   typevalue	tracebackfds         r   __exit__zGeneratedFileCleaner.__exit__   sY    &&(( 		!''"-  'r   NF)	r   r   r   __doc__r    rd   rQ   rq   r   r   r   r   r+   r+   n   s    5 
)
;r   r+   rg   returnc                 B    | j                  t        j                  d      S )N/)replacerf   sep)rg   s    r   _to_unix_pathr      s    <<$$r   rR   
extensionsc                 ,     t         fd|D              S )z<Helper method to see if filename ends with certain extensionc              3   @   K   | ]  }j                  |        y wrH   endswith).0erR   s     r   	<genexpr>z#match_extensions.<locals>.<genexpr>   s     8x  #8   any)rR   r   s   ` r   r,   r,      s    8Z888r   c                 ,     t         fd|D              S )Nc              3   J   K   | ]  }t        j                   |        y wrH   )fnmatch)r   patternfilepaths     r   r   z_fnmatch.<locals>.<genexpr>   s     Jgwx1Js    #r   )r   patternss   ` r   _fnmatchr      s    JJJJr   	root_pathincludesignoresout_of_place_onlyis_pytorch_extensionc              #     K   t        |      }t        j                  | d      D ]+  \  }}}	t        j                  j	                  ||       }
|
dk(  rPd|v r|j                  d       d|v r|j                  d       d|v r"|j                  d       |j                  d       |	D ]  }t        t        j                  j                  ||            }t        t        j                  j                  |
|            }t        ||      sbt        ||      rot        ||      s||v s|s%t        |      st        |      s|rt        |      s|  . y w)NT)topdown.z.gitbuildthird_partyzthird_party/nvfuser)r`   rf   walkrg   relpathremovert   r   joinr   r,   r:   r=   r9   )r   r   r   r   r   r   exact_matchesabs_dirpathdirs	filenamesrel_dirpathrR   r   rel_filepaths                 r   r-   r-      s(     MM +-'')T*J &dIggook9=#~F#$G$$M*12! 	H$RWW\\+x%HIH(k8)LML 8,!(G4%h
;x=?X+*<8AST`Aa (1N 	s   DEEE$1Eoutput_directoryr   	all_filesheader_include_dirsstatship_clang_launch	clean_ctxshow_progressc	                 f   t         j                  j                  t         j                  j                  | |            }	t	        t
        j                  |	      }
|
t        |	<   t        | ||||||||	      }|r2d|j                  vr$t        |	d|j                  |j                  d       |t        |	<   y )N)r   r   ignoredz->T)flush)rf   rg   rj   r   r   r   r   r$   r?   r   printr   )r   r   r   r   r   r   r   r   r   fin_pathhipify_resultresults               r   r.   r.      s     wwrww||,<hGHH |/G/GW_`M$1!*HiATV[*,@)]\F &--7d  &--t	= %+!r   c                     | d   D ch c]  \  }}|	 }}}t        dt        |      d       t        dj                  |             t        dt        | d         d       y c c}}w )Nunsupported_callsz1Total number of unsupported CUDA function calls: r   , z+
Total number of replaced kernel launches: kernel_launches)r   lenr   )r   	cuda_call	_filepathr   s       r   r/   r/      sx    AFGZA[\'=	9\\ 
=cBS>TUV=W
XY 
$))%
&' 
8UCT=U9VWX8Y
Z[ ]s   A&c                    d}d}| j                  dd      j                  dd      } t        d      D cg c]  }i  }}d||   d<   t        |       D ]b  \  }}|dkD  r nX|dk(  r|dz  }n
|d	k(  r|dz  }|d
k(  s|t        |       dz
  k(  s9|dk(  s?||d
k7  z   ||   d<   |dz  }|dk  sX|dz   ||   d<   d | |d   d   |d   d   dz    }| |d   d   |d   d    }	| |d   d   |d   d    j                  dd      j	                  d      }
| |d   d   |d   d    j                  dd      j	                  d      }d|
 d	}d| d	}|j                  |
|      }|	j                  ||      }|j                  ||	z   ||z         }|S c c}w )zBadds dim3() to the second and third arguments in the kernel launchr   <<<r   >>>r   startr   (),end
 zdim3()r   range	enumerater   strip)kernel_stringcuda_kernelcountclosure_arg_locsindcfirst_arg_rawsecond_arg_rawfirst_arg_cleansecond_arg_cleanfirst_arg_dim3second_arg_dim3first_arg_raw_dim3second_arg_raw_dim3s                   r   r0   r0      s   EG!))%4<<UBGM27(%;Qb%;H%; HUOGM* 3Q198qLG#XqLGHs=1A557a<%(AH%5HUOE"QJEqy+.7(3 "(1+g"6x{57IA7MNM"8A;w#7E8JKN#HQK$8!U9KLTTUY[]^ddehiO$Xa[%9(1+e:LMUUVZ\^_eefij_-Q/N./q1O&..O(001A?S%%mn&DFX[nFnoK7 &<s   	Fz([ ]+)(detail?)::[ ]+\\\n[ ]+c           
          t         j                  d          fd}d }d }t         | |                   } }|D ]  } ||      } j                  d|d         }	 |d   d   |	d	z    }
 |d   |d    }|d	   d   d
k(  rdnd	} |d   d   ||   d   d	z    }t	        ||
      }t        t        d|d   j                  dd      j                  dd                  }d|dd
 j                  ddd|z
  z  dz         j                  dd      j                  dd      j                  |d|z   dz         z   }|j                  |
|      }|d   j                  |         |S )zK Replace the CUDA style Kernel launches with the HIP style kernel launches.c                 L    | j                  d       | j                  d       dS )Nr   r   z::groupinps    r   <lambda>z'processKernelLaunches.<locals>.<lambda>  s!    1syy|nB.O r   c                     | d   | d   dddddddd}ddi}d}d}d	}d
}|}t        |d   d   dz
  dd      D ]  }
|   }	|||fv rJ|	dk(  r||k(  r
|}||d   d<   |dxx   dz  cc<   |	dk(  r$|dxx   dz  cc<   |d   dk(  r||k(  r
||d   d<   |}||k7  s^
|   j                         s
|   dv r-||k7  r
|}||d   d<   |dk(  sd|d   d<   |d   |d   |d   gc S ||k(  s||d   d<   |d   |d   |d   gc S  y )Nr   r   r   r   ry   )kernel_launchkernel_nametemplatez<>r   r   r      r   >r   <>   r   #r   r   :r   )r   isalnum)	in_kernelposr   STARTAT_TEMPLATEAFTER_TEMPLATEAT_KERNEL_NAMEr   icharstrings             r   grab_method_and_templatez7processKernelLaunches.<locals>.grab_method_and_template  s    (1'9)EBRS%'3"$R0
 q	  s?+G4q8"bA %	aA!9D %--3;!,12J.$K1$K3;$K1$KT{a'V{-B34J0!/ $!9$$&&)7P*P/!/45M*51 Av67M*73 "%]!3s:#oJ^`` /67M*73 "%]!3s:#oJ^``K%	ar   c                    d}g }| j                  d|      dk7  re| j                  d|      }| j                  d|      dz   }|dk  rt        d      |j                  ||| || d       | j                  d|      dk7  re|S )zKFinds the starting and ending points for all kernel launches in the string.r   r   ry   r   r   zno kernel end found)r   r   r   )findr(   rt   )r   
kernel_endkernel_positionskernel_starts       r   find_kernel_boundsz1processKernelLaunches.<locals>.find_kernel_boundsT  s    
 kk%,2!;;uj9L  UL9A=JQ !677 ##l:.4\:.N%P Q kk%,2  r   c                    d}d}d}| D ]z  }|dk(  r,|dk(  r|dk(  rd}nT|dk(  r|dk(  rd}nG|dk(  rB|dk7  r=|dk7  r8d}n5|dk(  r|d	k(  s|d
k(  r&d}n#|dk(  r|dk(  r|dk(  rd}n|dk(  r|dk(  r|dk7  rd}|}|dk(  r||z  }v|dz  }| |S )Nr   r   z//*z/*"\'r   xr   )r   
in_commentprev_c
new_stringr   s        r   mask_commentsz,processKernelLaunches.<locals>.mask_commentsl  s    

 	"AR8#!%J#X&C-!%J#X&D.Vs]!$Jt#9T	!#Jt#8#!#Js"8$!#JFRa
c!
3	"4 r   r   r   r   r   r   ry   r   r   r   r   zhipLaunchKernelGGL(z, 0   r   r   )	RE_KERNEL_LAUNCHsublistr   r0   r   rC   r   rt   )r   r   r   r  r  get_kernel_positionsoutput_stringkernelparamsparenthesisr   r   end_param_indexkernel_name_with_templatecuda_kernel_dim3num_klp
hip_kernels   `                r   r1   r1     s    !!"OQWXF9av 0B   2=3H IJM ' 4)&1 kk#ve}5 VAYw/a@vgve}=%ay/25!1$*6!9W+=f_>UV[>\_`>`$a!#M;?'6'?+B+B5#+N+V+VW\^a+bcd*-=a-C-K-K5AK(50.229'%2Fww4H !:CB[<[^a<abc

 &--k:F 	 ''
3144 r   c                     d}d}|}d\  }}|t        |       k  rM| |   |d   k(  r|du rd}d}|}n#|dz  }n| |   |d   k(  r|r|dz  }|dk(  r|}||fS |dz  }|t        |       k  rMy)a  Generalization for finding a balancing closure group

         if group = ["(", ")"], then finds the first balanced parentheses.
         if group = ["{", "}"], then finds the first balanced bracket.

    Given an input string, a starting position in the input string, and the group type,
    find_closure_group returns the positions of group[0] and group[1] as a tuple.

    Example:
        >>> find_closure_group("(hi)", 0, ["(", ")"])
        (0, 3)
    Fr   )ry   ry   Tr   )NN)r   )input_stringr   r   inside_parenthesisparensr   p_startp_ends           r   r2   r2     s     F
CNGU
L!
!a(!U*%)"!#%(*/AaKF{~%q L!
!  r   c                 "    t        | |ddg      S )z%Finds the first balanced parantheses.{}r   r2   r  r   s     r   r3   r3         lE#sDDr   c                 "    t        | |ddg      S )z!Finds the first balanced bracket.r   r   r   r&  r'  s     r   r4   r4     r(  r   z\bassert[ ]*\(c                 ^    | }t         D ]!  }|j                  | dt         |    d      }# |S )a  FIXME: Temporarily replace std:: invocations of math functions
        with non-std:: versions to prevent linker errors NOTE: This
        can lead to correctness issues when running tests, since the
        correct version of the math function (exp/expf) might not get
        called.  Plan is to remove this function once HIP supports
        std:: math function calls inside device code

    r   )r   r   )r  r  funcs      r   r5   r5     sJ     !M# \%--$qk>QRV>W=XXY;Z[\ r   z:?:?\b(__syncthreads)\b(\w*\()c                     | ddg}t        fd|D              rS dv }|dv z  }|dv z  }|t        j                        duz  }|rd| z   S )	a  If the file makes kernel builtin calls and does not include the cuda_runtime.h header,
    then automatically add an #include to match the "magic" includes provided by NVCC.
    TODO:
        Update logic to ignore cases where the cuda_runtime.h is included by another file.
    zhip/hip_runtime.hzhip/hip_runtime_api.hc              3   X   K   | ]!  }t        j                  d | d| d       # yw)z#include ("z"|<z>)N)research)r   extr  s     r   r   z#hip_header_magic.<locals>.<genexpr>   s+     
W299C5C53]C
Ws   '*hipLaunchKernelGGL
__global__
__shared__Nz#include "hip/hip_runtime.h"
)r   RE_SYNCTHREADSr/  )r  headershasDeviceLogicr  s      @r   r6   r6     s     !M #$;<G

Ww
WW *]:Nlm33Nlm33Nn++M:$FFN 8<Gr   zGextern\s+([\w\(\)]+)?\s*__shared__\s+([\w:<>\s]+)\s+(\w+)\s*\[\s*\]\s*;c                 8    | }t         j                  d |      }|S )a  Match extern __shared__ type foo[]; syntax and use HIP_DYNAMIC_SHARED() MACRO instead.
       https://github.com/ROCm-Developer-Tools/HIP/blob/master/docs/markdown/hip_kernel_language.md#__shared__
    Example:
        "extern __shared__ char smemChar[];" => "HIP_DYNAMIC_SHARED( char, smemChar)"
        "extern __shared__ unsigned char smem[];" => "HIP_DYNAMIC_SHARED( unsigned char, my_smem)"
    c                 |    d| j                  d      xs d d| j                  d       d| j                  d       dS )	NzHIP_DYNAMIC_SHARED(r   r   r   r   r   r   r   r   r   s    r   r   z'replace_extern_shared.<locals>.<lambda>  s<    )#))A,*<")=Qsyy|nBsyyYZ|n\]^ r   )RE_EXTERN_SHAREDr  )r  r  s     r   r7   r7     s(     !M$((^`moM r   c                    t         j                  j                  |       rJ |st        |       s| S t         j                  j	                  |       \  }}t         j                  j                  |      \  }}|dk(  rd}|}|}|j                  dd      }|j                  dd      }|j                  dd      }|j                  dd      }|j                  dd      }|d	k7  r|j                  dd      }|s%||k(  r t         j                  j                  |d      }|r||k(  r||z   |k(  r|d
z   }t         j                  j                  |||z         S )z3
    Returns the new name of the hipified file
    .cu.hipcudahipCUDAHIPTHCTHHzcaffe2/core_hip)rf   rg   isabsr9   rp   splitextr   r   )r   r   dirpathrR   rootr0  orig_filenameorig_dirpaths           r   r8   r8   "  s/    ww}}\***(El3GX  *ID#H e|MLoofe,Goofe,GooeU+G<<&D<<&D-||E5)G|$;'',,w.< 7TCZM<Yf}77<<,,r   c                     t         j                  j                  |       rJ | j                  d      ry| j                  d      ry| j                  d      ryy)Ntorch/Fthird_party/nvfuser/tools/autograd/templates/Trf   rg   rD  
startswithr   s    r   r9   r9   j  sP    ww}}\***x(56:;r   c                     t         j                  j                  |       rJ | j                  d      r| j                  d      ryy| j                  d      ry| j                  d      ry| j                  d      ryy)Nzaten/zaten/src/ATen/core/FTrK  rL  rM  rN  rP  s    r   r:   r:   v  ss    ww}}\***w'""#89x(56:;r   c                 >    t        |       rd| j                         v S y)NsparseFr:   lowerrP  s    r   r;   r;     s!    |$<--///r   c                     t        |       r9d| j                         v ryd| j                         v rd| j                         v ryyy)NrS  TlinalgbatchlinearalgebralibblasFrT  rP  s    r   r<   r<     sI    |$|))++++--*l.@.@.BBr   c                 
   t         j                  j                  |       rJ | j                  d      ryt         j                  j	                  |       }t         j                  j                  |      \  }}d|v xs |dv xr d|vS )Nzc10/cudaTgpur;  .cuhcudnn)rf   rg   rD  rO  basenamerE  )r   rR   r   r0  s       r   r=   r=     st    ww}}\***z*ww-HWWh'FAsX7!7VgX>UVr   c                       e Zd ZdZd Zy)TrieNodezA Trie node whose children are represented as a directory of char: TrieNode.
       A special char '' represents end of word
    c                     i | _         y rH   )childrenr"   s    r   r    zTrieNode.__init__  s	    r   N)r   r   r   r   r    r   r   r   r`  r`    s    r   r`  c                   ^    e Zd ZdZd Zd Zd Zd Zd Ze	j                  d        Zd Zd	 Zy
)r>   zCreates a Trie out of a list of words. The trie can be exported to a Regex pattern.
    The corresponding Regex should match much faster than a simple Regex union.c                     t               | _        t        j                  d      | _        | j                  j                         | _        y)z,Initialize the trie with an empty root node.F)usedforsecurityN)r`  rG  hashlibmd5_hashdigest_digestr"   s    r   r    zTrie.__init__  s/    J	[[7
zz((*r   c                 >   | j                   j                  |j                                | j                   j                         | _        | j
                  }|D ]5  }|j                  j                  |t                      |j                  |   }7 d|j                  d<   y)zAdd a word to the Trie. Tr   N)	rh  updateencoderi  rj  rG  rb  
setdefaultr`  r   wordnoder   s       r   ri   zTrie.add  sz    

$++-(zz((*yy 	'DMM$$T8:6==&D	' !br   c                     | j                   S )zReturn the root node of Trie. )rG  r"   s    r   dumpz	Trie.dump  s    yyr   c                 ,    t        j                  |      S )z Escape a char for regex. )r.  escape)r   r   s     r   quotez
Trie.quote  s    yyr   c                     | j                   }|D ]!  }||j                  v r|j                  |   }! y d|j                  v S )zZSearch whether word is present in the Trie.
        Returns True if yes, else return FalseFr   )rG  rb  ro  s       r   r/  zTrie.search  sJ     yy 	Dt}}$}}T*		 T]]""r   c                 N   |}d|j                   v r't        |j                   j                               dk(  ryg }g }d}t        |j                   j                               D ]o  }t	        |j                   |   t
              rN	 | j                  |j                   |   | j                        }|j                  | j                  |      |z          nd}q t        |      dkD   }	t        |      dkD  rIt        |      dk(  r|j                  |d          n&|j                  ddj                  |      z   dz          t        |      dk(  r|d   }
nddj                  |      z   d	z   }
|r|	r|
d
z  }
|
S d|
 d}
|
S # t        $ r$ |j                  | j                  |             Y Bw xY w)zConvert a Trie into a regular expression pattern

        Memoized on the hash digest of the trie, which is built incrementally
        during add().
        r   r   Nr   []z(?:|r   ?z)?)rb  r   keyssorted
isinstancer`  _patternrj  rt   rv  	Exceptionr   )r   rG  ri  rq  altccqr   recursecconlyr   s              r   r  zTrie._pattern  s    3t}}'9'9';#<#A4==--/0 	D$---x80"mmDMM$,?NGJJtzz$/'9: 	 X\!r7Q;2w!|

2a5!

3,s23s8q=VFSXXc]*S0F#  vhb)- ! 0IIdjj./0s   AE77)F$#F$c                 N    | j                  | j                  | j                        S z#Export the Trie to a regex pattern.r  rG  rj  r"   s    r   r   zTrie.pattern      }}TYY55r   c                 N    | j                  | j                  | j                        S r  r  r"   s    r   export_to_regexzTrie.export_to_regex  r  r   N)r   r   r   r   r    ri   rs  rv  r/  	functools	lru_cacher  r   r  r   r   r   r>   r>     sF    S+	!# ) )V66r   r>   PYTORCH_MAPr   z(?<=\W)(z)(?=\W)z#include "([^"]+)"z#include <([^>]+)>z"#define THC_GENERIC_FILE "([^"]+)"z\.cu\bc	                 b
    t         j                  j                  t         j                  j                   |            t           }	|vr%d|	_        d|	_        t        j                  |	_	        |	S t        t         j                  j                  |             }
t        d      5 }|j                         t        k(  r.d|	_        d|	_        t        j                  |	_	        |	cddd       S |j                  d       |j!                         }ddd       }t         j                  j                  t         j                  j                   t#        |
                  }t         j                  j%                  t         j                  j'                  |            s.j)                  t         j                  j'                  |             d fd}rt*        j-                  |      }n]t/        |
      rt*        j-                  ||      }n;t1        |
      rt*        j-                  |      }nd	 }t2        j-                  ||      }d# f	d	}t4        j-                   |dd
      |      }t6        j-                   |dd      |      }t8        j-                   |d      |      }|j;                  d      r:|j=                  dd      }|j=                  dd      }t>        j-                  d|      }stA        |      }|j;                  d      rd|vrtC        |      }tE        |      }ri||k(  rdt         j                  j'                        t         j                  j'                  |      k(  r%|	_        d|	_        t        j                  |	_	        |	S |k7  rtG        d      r	t        |z   }d
}t         j                  j%                  |      r)t        |d      5 }|j!                         |k7  }ddd       |rT	 j                  |dd      5 }|jI                  |       ddd       ||	_        d|	_        t        j                  |	_	        |	S ||	_        d"|	_        t        j                  |	_	        |	S # 1 sw Y   mxY w# 1 sw Y   xY w# 1 sw Y   lxY w# tJ        $ r~}tM        tN        jP                   d| d|jR                   d dtN        jT                   	tV        jX                          |	_        d!|	_        t        j                  |	_	        |	cY d}~S d}~ww xY w)$z< Executes the CUDA -> HIP conversion on the specified file. Nz[ignored, not to be hipified]zutf-8)encodingz#[ignored, input is hipified output]r   c                 2    t         | j                  d         S Nr   )r  r   ms    r   pt_replzpreprocessor.<locals>.pt_repl[  s    1771:&&r   c                 Z    t         j                  | j                  d       |             S r  )PYTORCH_SPECIAL_MAPgetr   )r  r  s    r   pt_special_replz%preprocessor.<locals>.pt_special_repl^  s"    "&&qwwqz71:>>r   c                 2    t         | j                  d         S r  )
CAFFE2_MAPr   r  s    r   c2_replzpreprocessor.<locals>.c2_replk  s    !!''!*--r   Tc                 *   	  	
 fd}|S )Nc                 N   | j                  d      }t        j                  j                  |      |j	                  d      s"|j	                  d      r;|j	                  d      s*j                  t        | j                  d                  S rt        fdD              rnd }d }rt        j                  j                        }t        j                  j                  t        j                  j                  ||            }t        j                  j                  |      r|}|}|D ]  }t        j                  j                  |      }t        j                  j                  t        j                  j                  ||            }t        j                  j                  |      s|}|} || j                  d      S |t        vrt        |	       n|t        v rt        |   }|j                  t        j                   k(  rt        j                  j#                  |      }t        j                  j                  t        j                  j                  t        |                  }	|	|_        |t        |<   j                  t        j                  j#                  |	|	|            S ||            S t        |   j$                  }
j                  t        j                  j#                  |
|
|            S ||            S | j                  d      S )Nr   )z	ATen/cudazATen/native/cudazATen/native/nested/cudazATen/native/quantized/cudazATen/native/sparse/cudazATen/native/transformers/cudazTHC/rA  THCPc              3   @   K   | ]  }|j                          y wrH   r   )r   srR   s     r   r   z>preprocessor.<locals>.mk_repl.<locals>.repl.<locals>.<genexpr>  s     ,UaQZZ-A,Ur   r   )r   rf   rg   r^  rO  formatr8   r   dirnamerj   r   rh   r$   r.   r   r   r   r   r   )r  r   
header_dirheader_filepathheader_dir_to_checkheader_path_to_checkheader_include_dirheader_resultheader_rel_pathheader_fout_pathhipified_header_filepathrR   r   r   r   r   r   include_current_dirr   r   r   r   templs              @r   replz+preprocessor.<locals>.mk_repl.<locals>.replq  s   
Aww''*H & ' e$Q\\&-A||$5aggajBV$WXX$,U9,U)U!
"&&*,''//(*C'+-77??277<<H[]^;_+`(ww~~&:;%8
*>"*.A C*.0ggll;KM_.`+/1wwrww||L_ab?c/d,77>>*>?)<J.BOC #*771:%"*==34D4C4=?RTY[k4H)Ubd %(;;$7$HM$22l6N6NN*,''///K[*\+-77??277<<HXHYZik  IA<B ,C(6F3?L+O<$||BGGOOP`Pl<LR\-^  _ _APR\-^  _ _+>+O+]+](||BGGOOPhPt4LJT%V W W9H*%V W W 771:r   r   )r  r  r  r   r   r   r   r   r   r   r   r   s   `` r   mk_replzpreprocessor.<locals>.mk_replp  s    9	 9	t r   z#include "{0}"z#include <{0}>Fz#define THC_GENERIC_FILE "{0}"zCMakeLists.txtr?  r@  rA  rB  r<  r[  	PowKernelz[skipped, no changes])r;  r\  .c.cc.cpp.h.hppwz[ok]zFailed to save z with "z", leaving z unchanged.filez[skipped, no permissions]z[skipped, already hipified])T)-rf   rg   rj   r   r$   r   r   r   r   r   r   r   rQ   readlineHIPIFY_C_BREADCRUMBseekreadr8   rh   r  rq   RE_PYTORCH_PREPROCESSORr  r<   r:   RE_CAFFE2_PREPROCESSORRE_QUOTE_HEADERRE_ANGLE_HEADERRE_THC_GENERIC_FILEr   r   RE_CU_SUFFIXr1   r5   r6   r,   writePermissionErrorr   r*   rX   strerrorrZ   sysstderr)r   r   r   r   r   r   r   r   r   r   r   finoutput_sourceorig_output_source	fout_pathr  r  r  do_writefout_oldfoutr   r   r  s   ` ```````             @@r   r?   r?   5  sd    wwrww||,<hGHH'1My &*#>&2&7&7# ;K!LML	h	) #S<<>00*.M'#HM *6*;*;M' # # 	
# ' -=?PQ]_s?t uvI77>>"''//)45277??956'?
 /33G]K<(377WM\*377OM.266wNM; ;x $''0@$(GWM#''0@%(H-XM'++G4T,UWdeM )*%--fe<%--eU;$((? -mUC 	/*80K.}= %]3M 	-/GGOOH%)CC&.#6&2&7&7# 9!1(<n!o+m;H	ww~~i )g. 	8(}}-7H	8	!	3A *T

=)**3M'#)M *6*;*;M'   '0#<&2&7&7#C# #X	8 	8* *  	!W__%_YKwqzzlR]^f]ggrszss  sA  Bzz#*2M'#>M *6*;*;M'  	!sU   0<R6!R+R
R' R0,R' RRR$ R' '	T.0A3T)#T.)T.c                 X   t        | d      5 }|j                         }|r2t        j                  dt        j                  |       dfd|      }n|j                  |      }|j                  d       |j                  |       |j                          d d d        y # 1 sw Y   y xY w)Nr+z\b(z)\bc                     S rH   r   )r
  replace_strings    r   r   z+file_specific_replacement.<locals>.<lambda>  s    n r   r   )	r)   r  r.  r  ru  r   r  r  truncate)r   search_stringr  strictr   contentss     `   r   r@   r@     s    	x	 !668vvRYY}%=$>cBD\^fgH''~FH	q			

  s   B	B  B)c                    t        | d      5 }|j                         }|d   dk7  r|d   dk7  rd| d}d| d|z   }|j                  d       |j                  |       |j	                          d d d        y # 1 sw Y   y xY w)	Nr  r   r   ry   r   r  z	#include z 
)r)   r  r  r  r  )r   headerr   r  s       r   rA   rA     s    	x	 !668!9r
c 1]Fxs+x7	q			

  s   A"A88Bc                 *    | j                  dd      } | S )z<Static global kernels in HIP results in a compilation error.z __global__ staticr2  )r   )in_txts    r   rB   rB     s    ^^0,?FMr   z#include .*\nc                    g }ddd}| }|dz   }|t        |      k  r||   dk(  r|dxx   dz  cc<   nT||   dk(  r|dxx   dz  cc<   n>||   dk(  r|dxx   dz  cc<   n(||   dk(  r ||dz
     dk7  r|d   dkD  r|dxx   dz  cc<   |d   dk(  r|d   dk(  r|j                  ||d	       	 |S |d   dk(  r)|d   dk(  r!||   d
k(  r|j                  ||d	       |dz   }|dz  }|t        |      k  r|S )ad   Return the list of arguments in the upcoming function parameter closure.
        Example:
        string (input): '(blocks, threads, 0, THCState_getCurrentStream(state))'
        arguments (output):
            '[{'start': 1, 'end': 7},
            {'start': 8, 'end': 16},
            {'start': 17, 'end': 19},
            {'start': 20, 'end': 53}]'
    r   )r   r   r   r   r   r   r   -r   r   )r   rt   )r   r   	argumentsclosurescurrent_positionargument_start_poss         r   rC   rC     sj    IH )A- S[
("#s*SMQM$%,SMQM$%,SMQM$%,8H18L1MQT1TYabeYfijYjSMQM C=A(3-1"4'9BRST  C=A(3-1"4@P9QUX9X'9BRST!1A!5A+ S[
(. r   c                 x    | j                         dv ry| j                         dv ryt        j                  d      )zArgumentParser doesn't support type=bool. Thus, this helper method will convert
    from possible string types to True / False.)yestruety1T)nofalser   rw   0FzBoolean value expected.)rU  argparseArgumentTypeError)vs    r   rD   rD   ;  s:     	wwy22	
4	4(()BCCr   project_directoryshow_detailedheader_extensionsextra_fileshipify_extra_files_onlyc                 d  	 | dk(  rt        j                         } t         j                  j                  |       s t	        d       t        j                  d       |s| j                  d       | dz   }| |k7  r@D cg c]  }|j                  | |       c}	D cg c]  }|j                  | |       c}	t         j                  j                  |      st        j                  | |       t        t        t                    t        t        t        	            	t        t        |	|||            }t        |      }|D ]W  }t         j                  j!                  |      s t         j                  j#                  ||      }||vsG|j%                  |       Y ddlm} |D ]{  }t         j                  j!                  |      r	 ||      }n& |t         j                  j#                  ||            }|j+                  	fd	|j-                  d
      D               } |t/        d      }g g d}|s|n|D ]  }t1        |||||||||
	        t	        t2        j4                  dz   t2        j6                  z   t
        j8                         |rt;        |       t<        S c c}w c c}w )Nr   z,The project folder specified does not exist.r   r   _amd)r   r   r   r   r   r   )Pathc              3      K   | ]`  }|j                         st        t        |            r8t        t        |            s#t        |j                        rt        |       b y wrH   )is_filer   strr,   name)r   rg   r  r   r   s     r   r   zhipify.<locals>.<genexpr>  sP      
TH-c$i1 ,=> I
s   A)AA)r  T)r_   )r   r   z-Successfully preprocessed all matching files.r  )rf   getcwdrg   rh   r   r  exitrstripr   shutilcopytreer  mapr   r-   r`   rD  r   rt   pathlibr  extendrglobr+   r.   r*   rW   rZ   r  r/   r$   )r  r  r   r  r   r   r   r  r   r   r   r   r   r  r   includerO   r   all_files_setr   r  r  header_include_dir_pathr   r   s      `  `  `               r   rE   rE   F  sk   " BIIK 77>>+,<=   %,v5,,X`aWGOO$57GHaU\]66>>"35EF] 77>>*+)+;<Cx01H3}g./G'(8807J:K=QS TI 	NM  ww}}Q-q1AM!Q	  1 

77==+,&*+=&>#&*277<<8HJ\+]&^# 
"9"?"?"D
 	


 (DA	 46"ME&=Y; q'(8(IOb(-/?AUW`bo	qq 
'//K
Kgll
Zadakakl eg b]s   =J(J-)r   r   r   FFr   )F)r;  r\  r  r  r  r  z.inr  )r\  r  r  r   r   )r  r   Fr   TFFFN)cr   r  r   r.  r  r  rf   r   r   cuda_to_hip_mappingsr   r   typingr   collections.abcr   r	   r
   enumr   r  rf  r   r   dictr  HipifyFinalResultr  r$   __annotations__PYTORCH_TEMPLATE_MAP__all__r  r(   r)   r*   r+   r   boolr,   r   r-   r  r.   r/   r0   compiler  r1   r2   r3   r4   	RE_ASSERTr5   r4  r6   r9  r7   r8   r9   r:   r;   r<   r=   r`  r>   CAFFE2_TRIEr  PYTORCH_TRIEr  objectr  mappingr  itemssrcr}   dst	meta_data
API_CAFFE2ri   API_SPECIALr  API_PYTORCHr  r  r  r  r  r  r  r?   r@   rA   rB   
RE_INCLUDErC   rD   rE   r   r   r   <module>r     sz  0   	  
 	  6 5  $ -   4 D D l*+ T )+ & +!+*= s. .1
 & D% % %9s 9 9T 9
K  !"'%*))) ) 	)
  ) #) 08})X+++ + &	+
 CI+ + #+ (+ + !%+2
\ F 2::>? Wt#LE
E
 BJJ()	  =>: 2::hi E-PW \6 \6| f
v!#T#v+ #  # "Ggw'''mmo "
UAh!"I	y0S! $$	1kooc26N+.#C(#&C   	1i6K6KS\6\OOC !JsO""  $K$?$?$AB $"**1M1M1O0PPW%XY "**23"**23 bjj!FG rzz)$vvv v &	v
 CIv v #v (v v !-vp	 RZZ()
+\D  T"8$&#"!&$)04RRR R  	R
 R "R R R R R R R R "R ,-R  !Rr   