o
    wZh                  !   @   s  U d Z ddlZddlZddlZddlZddlZddlZddlmZ ddl	m
Z
 ddl	mZ ddlmZ ddlmZ dd	lmZmZ dd
lmZ ddlZddlZG dd deZG dd dZeeef ZdZi Zeed< 	 dddZg dZG dd de Z!dd Z"G dd dZ#G dd dZ$dedefddZ%d ed!ede&fd"d#Z'd$d% Z(	&	&	&	'	'dd(ed)ed*ed!ed+e&d,e&dee fd-d.Z)d/ed0ed1ed2ed3eee*f d4e&d,e&d5e$d6e&ddfd7d8Z+d9d: Z,d;d< Z-e.d=Z/d>d? Z0d@dA Z1dBdC Z2dDdE Z3e.dFZ4dGdH Z5e.dIZ6dJdK Z7e.dLZ8dMdN Z9ddOdPZ:dQdR Z;dSdT Z<dUdV Z=dWdX Z>dYdZ Z?G d[d\ d\Z@G d]d^ d^ZAeA ZBi ZCeA ZDi ZEeeeFf ed_< i ZGe
D ]UZHeIeHes_J eHJ D ]E\ZKZLeLd ZMeLdd ZNejOeNvreDPeK ejQeNv reEReKd`reMeGeK< neMeEeK< ejSeNvrejQeNvreBPeK eMeCeK< qcqUe.eBT ZUe.daeDT  dbZVe.dcZWe.ddZXe.deZYe.dfZZ	 d/ed0ed1ed2ed3eee*f d4e&d,e&d5e$d6e&defdgdhZ[ddidjZ\dkdl Z]dmdn Z^e.doZ_dpdq Z`drds Za	'	t	u	`	&	v	&	'	&	w	'	'	'	ddxedye&d!edzed/ed2ed)ed{ed+e&d*ed6e&d4e&d,e&d|e&d5ee$ def d}d~ZbdS )a   The Python Hipify script.
##
# Copyright (c) 2015-2016 Advanced Micro Devices, Inc. All rights reserved.
#               2017-2018 Advanced Micro Devices, Inc. and
#                         Facebook Inc. All rights reserved.
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
# THE SOFTWARE.
    N   )	constants)CUDA_TO_HIP_MAPPINGS)MATH_TRANSPILATIONS)Optional)Iterator)MappingIterable)Enumc                   @   s   e Zd ZdZdZdS )CurrentStater      N)__name__
__module____qualname__INITIALIZEDDONE r   r   O/var/www/auris/lib/python3.10/site-packages/torch/utils/hipify/hipify_python.pyr   -   s    r   c                   @   s   e Zd Zdd Zdd ZdS )HipifyResultc                 C   s   || _ || _d| _d S )N current_statehipified_pathstatus)selfr   r   r   r   r   __init__2   s   
zHipifyResult.__init__c                 C   s   d| j  d| j d| j S )NzHipifyResult:: current_state: z, hipified_path : z
, status: r   r   r   r   r   __str__7   s   zHipifyResult.__str__N)r   r   r   r   r   r   r   r   r   r   1   s    r   z;// !!! This is a file automatically generated by hipify!!!
HIPIFY_FINAL_RESULTZscalar_t)ZDtypeT)!
InputErroropenfbcolorsGeneratedFileCleanermatch_extensionsmatched_files_iterpreprocess_file_and_save_resultcompute_statsadd_dim3processKernelLaunchesfind_closure_groupfind_bracket_groupfind_parentheses_groupreplace_math_functionship_header_magicreplace_extern_sharedget_hip_file_pathis_out_of_placeis_pytorch_fileis_cusparse_fileis_special_fileis_caffe2_gpu_filer5   Triepreprocessorfile_specific_replacementfile_add_headerfix_static_global_kernelsextract_argumentsstr2boolr   r   hipifyc                       s$   e Zd Z fddZdd Z  ZS )r    c                    s   t  | || _d S N)superr   message)r   r@   	__class__r   r   r   N   s   
zInputError.__init__c                 C   s   d| j  S )NzInput error: )r@   r   r   r   r   r   R   s   zInputError.__str__)r   r   r   r   r   __classcell__r   r   rA   r   r    K   s    r    c                 C   s   t | |ddS )Nignore)errors)open)filenamemoder   r   r   r!   V      r!   c                   @   s,   e Zd ZdZdZdZdZdZdZdZ	dZ
d	S )
r"   z[95mz[94mz[92mz[93mz[91mz[0mz[1mz[4mN)r   r   r   HEADERZOKBLUEOKGREENWARNINGFAILENDCZBOLDZ	UNDERLINEr   r   r   r   r"   [   s    r"   c                   @   s<   e Zd ZdZdddZdd Zdd Zdd	d
Zdd ZdS )r#   z+Context Manager to clean up generated filesFc                 C   s   || _ t | _g | _d S r>   )keep_intermediatessetfiles_to_cleandirs_to_clean)r   rO   r   r   r   r   p   s   
zGeneratedFileCleaner.__init__c                 C   s   | S r>   r   r   r   r   r   	__enter__u   s   zGeneratedFileCleaner.__enter__c                 O   s6   t j|s| jt j| t|g|R i |S r>   )ospathexistsrQ   addabspathrF   )r   fnargskwargsr   r   r   rF   x   s   zGeneratedFileCleaner.openc                 C   s|   t j|\}}|st j|\}}|r#|r#t j|s#| j|dd t j|r+|s<t | | jt j	| d S d S )NT)exist_ok)
rT   rU   splitrV   makedirsisdirmkdirrR   appendrX   )r   dnr\   parentnr   r   r   r^   }   s   
zGeneratedFileCleaner.makedirsc                 C   sD   | j s| jD ]}t| q| jd d d D ]	}t| qd S d S )N)rO   rQ   rT   unlinkrR   rmdir)r   typevalue	tracebackfdr   r   r   __exit__   s   
zGeneratedFileCleaner.__exit__NF)	r   r   r   __doc__r   rS   rF   r^   rm   r   r   r   r   r#   n   s    


r#   rU   returnc                 C   s   |  tjdS )N/)replacerT   sep)rU   r   r   r   _to_unix_path   rI   rt   rG   
extensionsc                       t  fdd|D S )z<Helper method to see if filename ends with certain extensionc                 3   s    | ]}  |V  qd S r>   endswith).0erG   r   r   	<genexpr>       z#match_extensions.<locals>.<genexpr>any)rG   ru   r   r{   r   r$         r$   c                    rv   )Nc                 3   s    | ]	}t   |V  qd S r>   )fnmatch)ry   patternfilepathr   r   r|      s    z_fnmatch.<locals>.<genexpr>r~   )r   patternsr   r   r   _fnmatch   s   r   r   F	root_pathincludesignoresout_of_place_onlyis_pytorch_extensionc                 c   s    t |}tj| ddD ]o\}}}	tj|| }
|
dkr<d|v r%|d d|v r.|d d|v r<|d |d |	D ]<}ttj||}ttj|
|}t	||rzt	||szt
||se||v rz|swt|spt|spq>|rwt|swq>|V  q>qd S )NT)topdown.z.gitbuildZthird_partyzthird_party/nvfuser)rP   rT   walkrU   relpathremovera   rt   joinr   r$   r2   r5   r1   )r   r   r   ru   r   r   Zexact_matchesZabs_dirpathdirs	filenamesZrel_dirpathrG   r   rel_filepathr   r   r   r%      s>   



r%   output_directoryr   	all_filesheader_include_dirsstatship_clang_launch	clean_ctxshow_progressc	              
   C   st   t jt j| |}	ttj|	d}
|
t|	< t| ||||||||	}|r4d|j	vr4t
|	d|j|j	dd |t|	< d S )N)r   r   Zignoredz->T)flush)rT   rU   rX   r   r   r   r   r   r7   r   printr   )r   r   r   r   r   r   r   r   r   fin_pathhipify_resultresultr   r   r   r&      s   

r&   c                 C   sP   dd | d D }t dt|d t d| t dt| d d d S )	Nc                 S   s   h | ]\}}|qS r   r   )ry   Z	cuda_callZ	_filepathr   r   r   	<setcomp>   s    z compute_stats.<locals>.<setcomp>unsupported_callsz1Total number of unsupported CUDA function calls: rl   , z+
Total number of replaced kernel launches: kernel_launches)r   lenr   )r   r   r   r   r   r'      s   r'   c                 C   s  d}d}|  dd dd} dd tdD }d|| d< t| D ]E\}}|d	kr+ n<|d
kr4|d	7 }n|dkr<|d	8 }|dksH|t| d	 krf|dkrf||dk || d< |d	7 }|dk rf|d	 || d< q!| |d d |d d d	  }| |d	 d |d	 d  }| |d d |d d   ddd}	| |d	 d |d	 d   ddd}
d|	 d}d|
 d}| |	|}| |
|}| || || }|S )zBadds dim3() to the second and third arguments in the kernel launchr   <<<r   >>>c                 S   s   g | ]}i qS r   r   )ry   _r   r   r   
<listcomp>   s    zadd_dim3.<locals>.<listcomp>r   startr   (),end
 zdim3()rr   range	enumerater   strip)kernel_stringcuda_kernelcountclosureZarg_locsindcZfirst_arg_rawZsecond_arg_rawZfirst_arg_cleanZsecond_arg_cleanZfirst_arg_dim3Zsecond_arg_dim3Zfirst_arg_raw_dim3Zsecond_arg_raw_dim3r   r   r   r(      s8   
  **r(   z([ ]+)(detail?)::[ ]+\\\n[ ]+c                    sT  t dd    fdd}dd }dd }t|| } }|D ]}||} d	|d
 }	 |d d |	d  }
 |d |d
  }|d d
 dkrPdnd} |d d || d
 d  }t||
}ttd|d dd	dd}d|dd ddd|  d dddd|d	| d  }||
|}|d | q"|S )zK Replace the CUDA style Kernel launches with the HIP style kernel launches.c                 S   s   |  d |  d dS )Nr   r   z::groupinpr   r   r   <lambda>  s    z'processKernelLaunches.<locals>.<lambda>c           
         sz  | d | d dddddddd}ddi}d}d}d	}d
}|}t |d d d ddD ]} | }	|||fv ro|	dkrQ||krI|}||d d< |d  d7  < |	dkro|d  d8  < |d dkro||kro||d d< |}||kr |  s | dv r||kr|}||d d< |dkrd|d d< |d |d |d g  S q-||kr||d d< |d |d |d g  S q-d S )Nr   r   r   r   re   )kernel_launchkernel_nametemplatez<>r   r   r      r   >r   <>   r   #:r   r   r   )r   isalnum)
Z	in_kernelposr   STARTZAT_TEMPLATEZAFTER_TEMPLATEZAT_KERNEL_NAMEr   icharstringr   r   grab_method_and_template  sJ   z7processKernelLaunches.<locals>.grab_method_and_templatec                 S   sr   d}g }|  d|dkr7|  d|}|  d|d }|dkr"td|||| || d |  d|dks|S )zKFinds the starting and ending points for all kernel launches in the string.r   r   re   r   r   zno kernel end found)r   r   r   )findr    ra   )r   Z
kernel_endZkernel_positionsZkernel_startr   r   r   find_kernel_boundsT  s   
z1processKernelLaunches.<locals>.find_kernel_boundsc                 S   s   d}d}d}| D ]f}|dkr3|dkr|dkrd}nF|dkr$|dkr$d}n;|dkr2|dkr2|dkr2d}n,|dkrB|d	ks?|d
krAd}n|dkrQ|dkrP|dkrPd}n|dkr_|dkr_|dkr_d}|}|dkrj||7 }q|d7 }q|S )Nr   rq   z//*z/*"\'r   xr   )r   Z
in_commentZprev_cZ
new_stringr   r   r   r   mask_commentsl  s8   

z,processKernelLaunches.<locals>.mask_commentsr   r   r   r   r   re   r   r   r   r   zhipLaunchKernelGGL(z, 0   r   r   )	RE_KERNEL_LAUNCHsublistr   r(   r   r;   rr   ra   )r   r   r   r   r   Zget_kernel_positionsoutput_stringZkernelparamsZparenthesisr   r   Zend_param_indexZkernel_name_with_templateZcuda_kernel_dim3Znum_klpZ
hip_kernelr   r   r   r)     s4   ;! 
"
r)   c                 C   s   d}d}|}d\}}|t | k rJ| | |d kr(|du r#d}d}|}n|d7 }n| | |d kr@|r@|d8 }|dkr@|}||fS |d7 }|t | k sdS )a  Generalization for finding a balancing closure group

         if group = ["(", ")"], then finds the first balanced parentheses.
         if group = ["{", "}"], then finds the first balanced bracket.

    Given an input string, a starting position in the input string, and the group type,
    find_closure_group returns the positions of group[0] and group[1] as a tuple.

    Example:
        >>> find_closure_group("(hi)", 0, ["(", ")"])
        (0, 3)
    Fr   )re   re   Tr   )NN)r   )input_stringr   r   Zinside_parenthesisparensr   Zp_startZp_endr   r   r   r*     s&   
r*   c                 C      t | |ddgdS )z%Finds the first balanced parantheses.{}r   r*   r   r   r   r   r   r+        r+   c                 C   r   )z!Finds the first balanced bracket.r   r   r   r   r   r   r   r   r,     r   r,   z\bassert[ ]*\(c                 C   s.   | }t D ]}|| dt |  d}q|S )a  FIXME: Temporarily replace std:: invocations of math functions
        with non-std:: versions to prevent linker errors NOTE: This
        can lead to correctness issues when running tests, since the
        correct version of the math function (exp/expf) might not get
        called.  Plan is to remove this function once HIP supports
        std:: math function calls inside device code

    r   )r   rr   )r   r   funcr   r   r   r-     s   	r-   z:?:?\b(__syncthreads)\b(\w*\()c                    sh   |  ddg}t  fdd|D r S d v }|d v 7 }|d v 7 }|t du7 }|r2d	|    S )
a  If the file makes kernel builtin calls and does not include the cuda_runtime.h header,
    then automatically add an #include to match the "magic" includes provided by NVCC.
    TODO:
        Update logic to ignore cases where the cuda_runtime.h is included by another file.
    zhip/hip_runtime.hzhip/hip_runtime_api.hc                 3   s*    | ]}t d | d| d V  qdS )z#include ("z"|<z>)N)research)ry   extr   r   r   r|      s   ( z#hip_header_magic.<locals>.<genexpr>ZhipLaunchKernelGGL
__global__Z
__shared__Nz#include "hip/hip_runtime.h"
)r   RE_SYNCTHREADSr   )r   headersZhasDeviceLogicr   r   r   r.     s   r.   zGextern\s+([\w\(\)]+)?\s*__shared__\s+([\w:<>\s]+)\s+(\w+)\s*\[\s*\]\s*;c                 C   s   | }t dd |}|S )a  Match extern __shared__ type foo[]; syntax and use HIP_DYNAMIC_SHARED() MACRO instead.
       https://github.com/ROCm-Developer-Tools/HIP/blob/master/docs/markdown/hip_kernel_language.md#__shared__
    Example:
        "extern __shared__ char smemChar[];" => "HIP_DYNAMIC_SHARED( char, smemChar)"
        "extern __shared__ unsigned char smem[];" => "HIP_DYNAMIC_SHARED( unsigned char, my_smem)"
    c                 S   s.   d|  dpd d|  d d|  d dS )	NzHIP_DYNAMIC_SHARED(r   r   r   r   r   r   r   r   r   r   r   r   r     s   . z'replace_extern_shared.<locals>.<lambda>)RE_EXTERN_SHAREDr   )r   r   r   r   r   r/     s
   r/   c                 C   s   t j| rJ |st| s| S t j| \}}t j|\}}|dkr&d}|}|}|dd}|dd}|dd}|dd}|dd}|d	krR|dd}|s_||kr_t j|d}|ro||kro|| |kro|d
 }t j||| S )z3
    Returns the new name of the hipified file
    .cu.hipcudaZhipCUDAHIPTHCTHHzcaffe2/coreZ_hip)rT   rU   isabsr1   r]   splitextrr   r   )r   r   dirpathrG   rootr   orig_filenameZorig_dirpathr   r   r   r0   "  s*   $r0   c                 C   s>   t j| rJ | drdS | drdS | drdS dS )Ntorch/Fthird_party/nvfuser/tools/autograd/templates/TrT   rU   r   
startswithr   r   r   r   r1   j  s   


r1   c                 C   sZ   t j| rJ | dr| drdS dS | drdS | dr$dS | dr+dS dS )Nzaten/zaten/src/ATen/core/FTr   r   r   r   r  r   r   r   r2   v  s   




r2   c                 C   s   t | r
d|  v S dS )NsparseFr2   lowerr  r   r   r   r3     s   r3   c                 C   s<   t | rd|  v rdS d|  v rd|  v rdS dS dS )Nr  TZlinalgZbatchlinearalgebralibblasFr  r  r   r   r   r4     s   r4   c                 C   sR   t j| rJ | drdS t j| }t j|\}}d|v s%|dv o(d|vS )Nzc10/cudaTZgpur   .cuhZcudnn)rT   rU   r   r  basenamer   )r   rG   r   r   r   r   r   r5     s   
r5   c                   @   s   e Zd ZdZdd ZdS )TrieNodezA Trie node whose children are represented as a directory of char: TrieNode.
       A special char '' represents end of word
    c                 C   s
   i | _ d S r>   )childrenr   r   r   r   r     s   
zTrieNode.__init__N)r   r   r   ro   r   r   r   r   r   r	    s    r	  c                   @   sV   e Zd ZdZdd Zdd Zdd Zdd	 Zd
d Ze	j
dd Zdd Zdd ZdS )r6   zCreates a Trie out of a list of words. The trie can be exported to a Regex pattern.
    The corresponding Regex should match much faster than a simple Regex union.c                 C   s&   t  | _tjdd| _| j | _dS )z,Initialize the trie with an empty root node.F)usedforsecurityN)r	  r   hashlibmd5_hashdigest_digestr   r   r   r   r     s   zTrie.__init__c                 C   sT   | j |  | j  | _| j}|D ]}|j|t  |j| }qd|jd< dS )zAdd a word to the Trie. Tr   N)	r  updateencoder  r  r   r
  
setdefaultr	  r   wordnoder   r   r   r   rW     s   zTrie.addc                 C   s   | j S )zReturn the root node of Trie. )r   r   r   r   r   dump  s   z	Trie.dumpc                 C   s
   t |S )z Escape a char for regex. )r   escape)r   r   r   r   r   quote  s   
z
Trie.quotec                 C   s4   | j }|D ]}||jv r|j| }q dS d|jv S )zZSearch whether word is present in the Trie.
        Returns True if yes, else return FalseFr   )r   r
  r  r   r   r   r     s   

zTrie.searchc              	   C   sB  |}d|j v rt|j  dkrdS g }g }d}t|j  D ]4}t|j | trQz| |j | | j}|| 	||  W q t
yP   || 	| Y qw d}qt|dk }	t|dkr{t|dkro||d  n|dd| d  t|dkr|d }
n	dd| d	 }
|r|	r|
d
7 }
|
S d|
 d}
|
S )zConvert a Trie into a regular expression pattern

        Memoized on the hash digest of the trie, which is built incrementally
        during add().
        r   r   Nr   []z(?:|r   ?z)?)r
  r   keyssorted
isinstancer	  _patternr  ra   r  	Exceptionr   )r   r   r  r  Zaltccqr   recurseZcconlyr   r   r   r   r!    s:   
zTrie._patternc                 C      |  | j| jS z#Export the Trie to a regex pattern.r!  r   r  r   r   r   r   r        zTrie.patternc                 C   r&  r'  r(  r   r   r   r   export_to_regex  r)  zTrie.export_to_regexN)r   r   r   ro   r   rW   r  r  r   	functools	lru_cacher!  r   r*  r   r   r   r   r6     s    
+r6   PYTORCH_MAPr   z(?<=\W)(z)(?=\W)z#include "([^"]+)"z#include <([^>]+)>z"#define THC_GENERIC_FILE "([^"]+)"z\.cu\bc	                    s  t jt j|t }	| vrd|	_d|	_tj|	_	|	S t
t j|}
tdd*}| tkrHd|	_d|	_tj|	_	|	W  d   S |d | }W d   n1 s[w   Y  |}t jt jt|
}t jt j|st j| dd fd	d
}rt|}n t|
rt||}nt|
rt|}n
dd }t||}d' 	f	dd	}t|dd|}t|dd|}t|d|}|dr|dd}|dd}td|}st |	}|drd|vrt!|}t"|}r1||kr1t jt j|kr1|	_d|	_tj|	_	|	S |kr@t#dr@t| }d}t j|rft|dd}| |k}W d   n	1 saw   Y  |rz+j|ddd}|$| W d   n	1 sw   Y  ||	_d|	_tj|	_	|	W S  t%y } z*t&t'j( d | d!|j) d" d#t'j* 	t+j,d$ |	_d%|	_tj|	_	|	W  Y d}~S d}~ww ||	_d&|	_tj|	_	|	S )(z< Executes the CUDA -> HIP conversion on the specified file. Nz[ignored, not to be hipified]zutf-8)encodingz#[ignored, input is hipified output]r   c                 S      t | d S Nr   )r-  r   mr   r   r   pt_repl[  rI   zpreprocessor.<locals>.pt_replc                    s   t | d | S r0  )PYTORCH_SPECIAL_MAPgetr   r1  )r3  r   r   pt_special_repl^  r   z%preprocessor.<locals>.pt_special_replc                 S   r/  r0  )
CAFFE2_MAPr   r1  r   r   r   c2_replk  rI   zpreprocessor.<locals>.c2_replTc                    s$    	
fdd}|S )Nc              
      s  |  d}tj| |ds|dr%|ds%t|  dS rt fddD rd }d }rStj}tj	tj
||}tj|rS|}|}|d u rxD ]}tj
|}tj	tj
||}tj|rw|}|}qY|d u r|  dS |tvrt|
		 n=|tv rt| }|jtjkrtj|}tj	tj
t|}	|	|_|t|< tj|	d ur|	|S ||S t| j}
tj|
d ur|
|S ||S |  dS )Nr   )z	ATen/cudazATen/native/cudazATen/native/nested/cudazATen/native/quantized/cudazATen/native/sparse/cudazATen/native/transformers/cudazTHC/r   ZTHCPc                 3   s    | ]}|  V  qd S r>   rw   )ry   sr{   r   r   r|     r}   z>preprocessor.<locals>.mk_repl.<locals>.repl.<locals>.<genexpr>r   )r   rT   rU   r  r  formatr0   r   dirnamerX   r   rV   r   r&   r   r   r   r   r   )r2  rk   
header_dirZheader_filepathZheader_dir_to_checkZheader_path_to_checkheader_include_dirZheader_resultZheader_rel_pathZheader_fout_pathZhipified_header_filepath)r   r   r   r   r   include_current_dirr   r   r   r   templr{   r   replq  sn   




z+preprocessor.<locals>.mk_repl.<locals>.replr   )r?  r>  r@  )	r   r   r   r   r   r   r   r   r   )r>  r?  r   mk_replp  s    :zpreprocessor.<locals>.mk_replz#include "{0}"z#include <{0}>Fz#define THC_GENERIC_FILE "{0}"zCMakeLists.txtr   r   r   r   r   r  Z	PowKernelz[skipped, no changes])r   r  .c.cc.cpp.h.hppwz[ok]zFailed to save z with "z", leaving z unchanged.filez[skipped, no permissions]z[skipped, already hipified])T)-rT   rU   rX   r   r   r   r   r   r   r   rt   r   rF   readlineHIPIFY_C_BREADCRUMBseekreadr0   rV   r;  r^   RE_PYTORCH_PREPROCESSORr   r4   r2   RE_CAFFE2_PREPROCESSORRE_QUOTE_HEADERRE_ANGLE_HEADERRE_THC_GENERIC_FILErx   rr   RE_CU_SUFFIXr)   r-   r.   r$   writePermissionErrorr   r"   rL   strerrorrN   sysstderr)r   r   r   r   r   r   r   r   r   r   r   ZfinZoutput_sourceZorig_output_sourceZ	fout_pathr6  r8  rA  Zdo_writeZfout_oldZfoutrz   r   )
r   r   r   r   r   r   r   r3  r   r   r   r7   5  s   

	<


&r7   c                    s   t | d6}| }|rtdt| d fdd|}n|| }|d || |  W d    d S 1 s>w   Y  d S )Nr+z\b(z)\bc                    s    S r>   r   )r   replace_stringr   r   r     s    z+file_specific_replacement.<locals>.<lambda>r   )	r!   rM  r   r   r  rr   rL  rT  truncate)r   search_stringr[  strictrk   contentsr   rZ  r   r8     s   &


"r8   c                 C   s   t | d5}| }|d dkr|d dkrd| d}d| d| }|d || |  W d    d S 1 s=w   Y  d S )	NrY  r   r   re   r   r   z	#include z 
)r!   rM  rL  rT  r\  )r   headerrk   r_  r   r   r   r9     s   


"r9   c                 C   s   |  dd} | S )z<Static global kernels in HIP results in a compilation error.z __global__ staticr   rr   )Zin_txtr   r   r   r:     s   r:   z#include .*\nc                 C   s:  g }ddd}| }|d }|t |k r|| dkr"|d  d7  < n:|| dkr1|d  d8  < n+|| dkr@|d  d7  < n|| dkr\||d  dkr\|d dkr\|d  d8  < |d dkrs|d dkrs|||d	 	 |S |d dkr|d dkr|| d
kr|||d	 |d }|d7 }|t |k s|S )ad   Return the list of arguments in the upcoming function parameter closure.
        Example:
        string (input): '(blocks, threads, 0, THCState_getCurrentStream(state))'
        arguments (output):
            '[{'start': 1, 'end': 7},
            {'start': 8, 'end': 16},
            {'start': 17, 'end': 19},
            {'start': 20, 'end': 53}]'
    r   )r   r   r   r   r   r   r   -r   r   )r   ra   )r   r   	argumentsZclosurescurrent_positionZargument_start_posr   r   r   r;     s2   (	$r;   c                 C   s*   |   dv rdS |   dv rdS td)zArgumentParser doesn't support type=bool. Thus, this helper method will convert
    from possible string types to True / False.)yestruety1T)nofalserk   rd   0FzBoolean value expected.)r  argparseArgumentTypeError)vr   r   r   r<   ;  s
   
r<   r   r  rB  rC  rD  rE  z.inrF  r  rE  rF  r   Tproject_directoryshow_detailedheader_extensionsextra_fileshipify_extra_files_onlyc                    s  dkrt  t jstd td s"d d kr:fddD fddD t jsFt	 t
ttt
ttt
t|||d	}t|}|D ]}t j|sut j|}||vr~|| qfd
dlm} |D ]'}t j|r||}n	|t j|}| fdd|dD  q|d u rtdd}g g d}|s|n|D ]}t||||||||
	 qttjd tj tjd |rt| tS )Nr   z,The project folder specified does not exist.r   rq   Z_amdc                       g | ]}|  qS r   ra  )ry   includer   rs  r   r   r   e      zhipify.<locals>.<listcomp>c                    rx  r   ra  )ry   rD   rz  r   r   r   f  r{  )r   r   ru   r   r   r   )Pathc                 3   sH    | ]}|  rtt|rtt|st|j rt|V  qd S r>   )is_filer   strr$   name)ry   rU   )ru  r   r   r   r   r|     s    

zhipify.<locals>.<genexpr>r   T)rO   )r   r   z-Successfully preprocessed all matching files.rH  )rT   getcwdrU   rV   r   rW  exitrstripshutilcopytreer   maprt   r%   rP   r   r   ra   pathlibr|  extendrglobr#   r&   r"   rK   rN   rX  r'   r   )rs  rt  ru   ru  r   r   r   rv  r   r   r   r   r   rw  r   r   Zall_files_setrk   r|  r=  Zheader_include_dir_pathr   r   r   )ru  r   r   r   rs  r   r=   F  s\   








r=   )r   r   r   FFrn   )Frp  rq  r   r   rr  r   Fr   TFFFN)cro   rm  r   r   r  rW  rT   r   r   Zcuda_to_hip_mappingsr   r   typingr   collections.abcr   r   r	   enumr
   r+  r  r   r   dictr~  ZHipifyFinalResultrK  r   __annotations__ZPYTORCH_TEMPLATE_MAP__all__r"  r    r!   r"   r#   rt   boolr$   r   r%   r   r&   r'   r(   compiler   r)   r*   r+   r,   Z	RE_ASSERTr-   r   r.   r   r/   r0   r1   r2   r3   r4   r5   r	  r6   ZCAFFE2_TRIEr7  ZPYTORCH_TRIEr-  objectr4  mappingr   itemssrcri   dstZ	meta_dataZ
API_CAFFE2rW   ZAPI_SPECIALr5  ZAPI_PYTORCHr*  rO  rN  rP  rQ  rR  rS  r7   r8   r9   r:   Z
RE_INCLUDEr;   r<   r=   r   r   r   r   <module>   s  	
"
,
		

# &



H
^








		
 
9
.	
