U
    ,d5                     @   s$  d dl Z d dlZd dlZd dlmZ d dlZd dlZd dlZ	d dl
mZmZmZmZmZ d dlmZmZ d dlmZ d dl
mZmZ d dlmZmZmZmZmZmZmZmZmZ d dl m!Z! d d	l"m#Z# d
d Z$G dd de%Z&dd Z'G dd de%Z(dd Z)dd Z*dd Z+dd Z,dd Z-dS )    N)add)typesirrewritesconfigir_utils)infer_globalAbstractTemplate)	signature)utilstyping)	get_call_tablemk_unique_varcompile_to_numba_irreplace_arg_nodesguardfind_callnamerequire
find_constGuardException)NumbaValueError)OPERATORS_TO_BUILTINSc                 C   s   |dkr| | S | S d S Nr    )dim_sizeindex_constr   r   @/tmp/pip-unpacked-wheel-eu7e0c37/numba/stencils/stencilparfor.py_compute_last_ind   s    r   c                   @   sT   e Zd Zdd Zdd Zdd Zdd Zd	d
 Zdd Zdd Z	dd Z
dd ZdS )StencilPassc                 C   s.   || _ || _|| _|| _|| _|| _|| _d S N)func_irtypemap	calltypesarray_analysis	typingctx	targetctxflags)selfr    r!   r"   r#   r$   r%   r&   r   r   r   __init__!   s    zStencilPass.__init__c                    s  ddl m} t jj\}}g }i }| D ].\}}|D ] }t||r8|| |||< q8q,|sddS  jj D ]\}	}
tt	t
|
jD ]\}ttjrtjtjr̈jjdkr̈jjj|krtjj}fddttjjD }jj}t fdd|D }|D ]}t|tjrtd	q|d
}|jjj }t| j||
j|
j | j! j"\}}}|j#dd} $|	||||j%|||	}|
jd| | |
j|d d  |
_qttjrtjtjrjjdkrt&t' jjdkrt(dj _qqpdS )zP Finds all calls to StencilFuncs in the IR and converts them to parfor.
        r   )StencilFuncNcallc                    s   i | ]}| j j| qS r   )valueargs.0i)stmtr   r   
<dictcomp>H   s      z#StencilPass.run.<locals>.<dictcomp>c                 3   s   | ]} j |j V  qd S r   )r!   namer-   r'   r   r   	<genexpr>K   s     z"StencilPass.run.<locals>.<genexpr>zITuple parameters not supported for stencil kernels in parallel=True mode.outindex_offsets   )stencilnumba))Znumba.stencils.stencilr)   r   r    blocksitems
isinstanceappendreversedlist	enumeratebodyr   Assignr+   Expropfuncr2   dictkwsrangelenr,   tupler   Z	BaseTuple
ValueErrorgetget_stencil_irr$   scopelocr!   r"   options_mk_stencil_parfortargetr   r   Const)r'   r)   Z
call_table_Zstencil_callsZstencil_dictZcall_varname	call_listZone_calllabelblockr/   rG   
input_dictin_argsZarg_typemapZarg_typeout_arrsf
stencil_irrtarg_to_arr_dictr6   	gen_nodesr   )r'   r0   r   run+   sx    




    

    (
zStencilPass.runc              	   C   s   |  D ]\}}|j}|j}g }|jD ]x}	t|	tjr| }
t|
tjrdt|
j	tj
rd|
j	jdksht|t|
j	j	|| |t|| q&||	 q&||_qdS )z
        Find return statements in the IR and replace them with a SetItem
        call of the value "returned" by the kernel into the result array.
        Returns the block labels that contained return statements.
        castN)r;   rN   rO   rA   r<   r   ReturnpoprB   r+   rC   rD   AssertionErrorr=   ZJump)r'   r:   exit_value_varparfor_body_exit_labelrV   rW   rN   rO   new_bodyr0   Z	prev_stmtr   r   r   replace_return_with_setitemg   s     

z'StencilPass.replace_return_with_setitemc
           R         s	  g }
|j }tjdkr4td|||||| t| |d }j|j }t|j\}}t	|}t
|||jj tjdkrtd t| t|jj|j tjdkrtd t| j|j j |j}|j}g }t D ].}t|td|}tjj|j< || q||||||	\}}tjdkrhtd td| td	| t| g }j|}||} t|kstg }g }t D ]f}|| || |
||} || |
||}|| || |t!j"j#$|| ||d qt%|& d }t'||||< t|td
|} |j(j| j< g }! dkrd|d }"nPt|td|}"tj)*tj j|"j< tj+,||}#t-|#|"|}$|!|$ tjdkrtd t| t'||}%dkrj|j }td}&t||&|}'tj+.|d|}(tj)*tj|jj|&< |%j/0t-|(|'|g td})t||)|d|j1kr|j1d }*t2j33|*}+j45|+|j(st6d|(|*},n
|(d},t7|,|}-|j(j|)< |%j/0t-|-|g td}.t||.|t!j8jj9:|j(|j|j;jj< t|td|}/tj<=t>j|/j< t?dt>|}0t-|0|/|}1|%j/|1 tj+.|/|j(j|}2t|td|}3tj@A|j(j|3j< t-|2|3|}4|%j/|4 tBdt>jC|'|3gj4jj}5t|td|}6t-t7d||6|}7|5|7 tjDj|6j< t|td|}8t-t7d||8|}9|5|9 tjj|8j< t|td|}:j4EtF};|;j|:j< t?dtF|}<t-|<|:|}=|5|= j4G|;tjDfd i }>tj+jH|:|6|6fd|d}?|>j|?< t|td|}@tjIj|@j< t-|?|@|}=|5|=  fd d!}At|jD ]V}B|@g|j }C|@g|j }D|A|;|B|||:|5||C|8d"
 |A|;|B|||:|5||D||B d#
 qD|J| |%j/0|5 nd|j1kr^|j1d }*t2j33|*}+j45|+|j(sd}EtK|Et|td$|}@j4EtF};|;j|@j< t?dtF|}<t-|<|@|}F|%j/|F j4G|;tjDfd i }>tj+jH|@dd|d}G|>j|G< t|td%|}HtjIj|Hj< t-|G|H|}=|%j/|= t7|(|*|}It|td&|}J|j(j|Jj< t-|I|J|}K|%j/|K tLtFdd|H|J|}L|%j/|L tMtjDjj j|Hj jj j(}>|>j|L< N|| | tjdkrtd' t| tO|"| |}MtMtjDjj j|"j jj j(j|M< || j/0|! || j/|M tPd(d)}Nt|td&|N}Ot-tj7d|Nd*|O|N}K|| j/|K || j/tQ|O|N tR|}|t%|&  j/S  tjdk	rtd+ t| d,||gf}Pt!j"j#T||%|||"||PjU}Q|
|Q |
t-|| |
S )-z> Converts a set of stencil kernel blocks to a parfor.
        r7   rQ   r   z#stencil_blocks after copy_propagatez'stencil_blocks after removing dead codez$parfor_index_varz-stencil_blocks after replace stencil accesseszstart_lengths:zend_lengths:z$parfor_exit_valuez$parfor_index_tuple_varz.stencil_blocks after creating parfor index varNZin_arr_shapeshapeZzero_valcvalz-cval type does not match stencil return type.Zstencil_outputz	$np_g_varnpz$np_attr_attremptyz	$none_varz$zero_index_varz$slice_func_varslice   r   rE   r,   rG   rO   $slicec
                    s  j | tjfd i }
|| }t|ttjfs4tt|t	d|}tjj
|j< t|trvtt||||}nt|||}|| tjj||	r||fn||fd|d}|
j|< t|t	d|}tjj
|j< t|||}|| |||< t|t	d|}tjtj j
|j< tj||}t|||}|| t||}ttjj
j j
|j j
j jj|< || d S )Nrn   z$border_indr   ro   rp   z$border_index_tuple_var)r$   resolve_function_typer   intpr<   intr   Varrd   r   r!   r2   rB   rS   r=   rC   r*   r"   slice2_type
containersUniTuplebuild_tupleSetItemr
   nonedtype)slice_fn_tydimrN   rO   slice_func_varstmtsZborder_indsZborder_tuple_itemsZ	other_argZother_firstsigsiZsi_varZ	si_assignslice_callexprZborder_slice_varslice_assignZborder_ind_var
tuple_calltuple_assignsetitem_callndimsrZ   r'   Zzero_varr   r   handle_border<  sZ    




 
 


z5StencilPass._mk_stencil_parfor.<locals>.handle_borderTFz	$py_g_varz$slice_instz$cval_constz%stencil_blocks after replacing returnZstencilparfor_dummy)rO   z#stencil_blocks after adding SetItemr8   )Vr:   r   DEBUG_ARRAY_OPTprintr   dump_blocksr!   r2   Zcopy_propagateget_name_var_tableZapply_copy_propagater"   Zremove_deadr    	arg_namesndimrN   rO   rH   r   rt   r   r   rr   r=   _replace_stencil_accessesr#   Zget_equiv_setZ	get_shaperI   rd   _get_stencil_last_ind_get_stencil_start_indr9   ZparforsparforZLoopNestmaxkeysZBlockr{   rv   rw   rC   rx   rB   getattrrA   extendrP   r   Ztypeofr$   Zcan_convertrK   rS   coreZnpytypesArrayZlayoutmiscModulerk   Global	functionsZNumberClassZgen_np_callrl   rz   Zresolve_value_typerm   rq   r*   ru   Zinsert_equivr   StaticSetItemr
   rh   ry   ZLocrb   Zsimplify_CFGrc   ZParforr&   )Rr'   rV   rY   rZ   r\   r6   rR   return_typestencil_funcr^   r_   stencil_blocksin_arrZ
in_arr_typZin_cpsZout_cpsname_var_tablerN   rO   parfor_varsr/   Z
parfor_varstart_lengthsend_lengthsZ	loopnestsZ	equiv_setZin_arr_dim_sizesZ
start_indsZ	last_indslast_indZ	start_indrf   re   Zfor_replacing_retZparfor_ind_varr   r   Z
init_blockZ
shape_nameZ	shape_varZshape_getattrZ	zero_namerj   Zcval_tyZtemp2Z
full_constZso_nameZdtype_g_np_varZ
dtype_g_npZdtype_g_np_assignZdtype_np_attr_callZdtype_attr_varZdtype_attr_assignr   Znone_varZnone_assignZzero_index_varZzero_index_assignr~   r|   Zslice_gr   r   r   	slice_varr   r}   Zstart_tuple_itemsZlast_tuple_itemsmsgZslice_assignedZcallexprZslice_inst_varZcval_const_valZcval_const_varZcval_const_assignZsetitemexprr   Z	dummy_locZret_const_varpatternr   r   r   r   rQ      sD   
  





    




      

  


 
















8



  


 






    
zStencilPass._mk_stencil_parforc                 C   s4  |}|dkr0t |td|}tj| j|j< t|tj	rRt 
t ||||}nt 
|||}|| t |td|}tj| j|j< t |td|}	tt}
tj|
}|| j|	j< t d|
|}t 
||	|}|| t j|	||gd|}|| jtjtjgi | j|< t 
|||}|| |S )Nr   Zstencil_const_varr   Zcompute_last_ind_varr   r   )r   rt   r   r   rr   r!   r2   r<   numbersNumberrB   rS   r=   r9   Znjitr   r   Z
Dispatcherr   rC   r*   Zget_call_typer$   r"   )r'   r   Z
end_lengthr_   rN   rO   r   r   const_assignZg_varZ
check_funcZfunc_typZg_objZg_assign
index_callindex_assignr   r   r   r     s>    
 


 
 

z!StencilPass._get_stencil_last_indc           	      C   s   t |trtt|dS dd }t|i | j| jtjf| j	| j
}t|jdksRt|j d }t||g ||jd d 7 }|jd jj}|S )Nr   c                 S   s   t t| dS r   )absmin)Zs_lengthr   r   r   get_start_ind  s    z9StencilPass._get_stencil_start_ind.<locals>.get_start_indr7   )r<   rs   r   r   r   r$   r%   r   rr   r!   r"   rI   r:   rd   popitemr   rA   r+   )	r'   Zstart_lengthr_   rN   rO   r   f_irrW   Zret_varr   r   r   r     s    

  z"StencilPass._get_stencil_start_indc              	      s  j }|d }dd |D }	d|jkr`|jd D ]}
|
 kr0tdq0 fdd|jd D }ng }|j|krvtdj|j j}|j}|j}|jdk}|r|dg }|dg }n d	d |jD }d
d |jD }t	
|}d}| D ]\}}g }|jD ]}t|tjr@t|jtjr@|jjdkr@|jjj|	ksjt|tjs\t|tjrr|jj|	krrtdt|tjrt|jtjr|jjdkr|jjj|	kr|jjj|kr|jj}|dkr|g}n"t|dr|j|kr||j }t	|_fdd|D }|r6|t||||}|rt|tjs^tdd |D rftdttt||}ttt ||}d}|t||||}|dkr|d }nPt|t!d|}t"j#$t"j%|j|j< tj&||}t|||}|'| t(fdd|D r0j|jjj j)}nj|jjj }tj*|jj||}t+|j|jjj j|j j,|< ||_|'| q||_q|r|std||fS )z Convert relative indexing in the stencil kernel to standard indexing
            by adding the loop index variables to the corresponding dimensions
            of the array index tuples.
        r   c                 S   s   g | ]
}|j qS r   )r2   r.   xr   r   r   
<listcomp>&  s     z9StencilPass._replace_stencil_accesses.<locals>.<listcomp>Zstandard_indexingz[Standard indexing requested for an array name not present in the stencil kernel definition.c                    s   g | ]} | qS r   r   r   )r^   r   r   r   -  s     zYThe first argument to a stencil kernel must use relative indexing, not standard indexing.Nc                 S   s   g | ]}|d  qS )r   r   r   r   r   r   r   D  s     c                 S   s   g | ]}|d  qS )r7   r   r   r   r   r   r   E  s     F)setitemZstatic_setitemz?Assignments to arrays passed to stencil kernels is not allowed.)Zstatic_getitemgetitemr7   r2   c                    s   g | ]}t  j|qS r   )_get_const_index_exprr    r.   v)r'   r\   r   r   r   o  s     c                 S   s   g | ]}t |t qS r   r<   rs   r   r   r   r   r   z  s     z<Variable stencil index only possible with known neighborhoodTz$parfor_index_ind_varc                    s   g | ]} j |j tjkqS r   )r!   r2   r   rr   r   r3   r   r   r     s   z=Stencil kernel with no accesses to relatively indexed arrays.)-r:   rP   rK   r2   r!   r   rN   rO   Zneighborhoodr   Zget_tuple_tabler;   rA   r<   r   rB   r+   rC   rD   ry   r   rR   indexhasattrZbuild_definitionsZ_definitions_add_index_offsetsr?   rt   anymapr   r   r   r   rv   rw   rr   rx   r=   allr{   r   r
   r"   )r'   r\   r   rY   r6   r   r^   r   r   Zin_arg_namesr   Zstandard_indexedr   rN   rO   Zneed_to_calc_kernelr   r   Ztuple_tableZfound_relative_indexrV   rW   rg   r0   
index_list
index_varsZind_varr   r   Zgetitem_return_typZgetitem_callr   )r^   r'   r\   r   r     s    













      

 



z%StencilPass._replace_stencil_accessesc                 C   s<  t |t |ksttdd || D r:ttt||S g }g }tt |D ]}|| }	t|	trt	
|td|}	tj| j|	j< t	t	|| ||	|}
||
 || }t|trt	
|td|}tj| j|j< t	t	|| |||}
||
 t|	ts&t| j|	j tjjr\| j|j tjks>t| |	||||}|| qNt|tst| j|j tjjr| j|	j tjkst| ||	|||}|| qNt	
|td|}tj| j|j< t	jtj|	||}| jtjtjtjfi | j|< t	|||}|| || qN|| |S )zw Does the actual work of adding loop index variables to the
            relative index constants or variables.
        c                 S   s   g | ]}t |tqS r   r   r   r   r   r   r     s     z2StencilPass._add_index_offsets.<locals>.<listcomp>old_index_var
offset_varZoffset_stencil_index)rI   rd   r   r?   r   r   rH   r<   rs   r   rt   r   r   rr   r!   r2   rB   rS   r=   rm   r   Z	SliceType_add_offset_to_slicerC   binopoperatorr$   rq   r"   r   )r'   r   r6   rg   rN   rO   	out_nodesr   r/   r   r   r   	index_varr   r   r   r   r   r     s    
  
  
  
  
   
 


zStencilPass._add_index_offsetsc                 C   s   t |trBd|j|j}i }t|i | |d }|g}tjf}	n&dd }||g}| j|j	 }
|
tjf}	| j
jjj}t||| j| j|	| j| j}|j \}}t|| |jd jj}||jd d  |S )NzRdef f(offset):
                return slice({} + offset, {} + offset)
            fc                 S   s   t | j| | j| S r   )rm   startstop)Z	old_sliceoffsetr   r   r   r     s    z+StencilPass._add_offset_to_slice.<locals>.fr   )r<   rm   formatr   r   execr   rr   r!   r2   r    Zfunc_idrE   __globals__r   r$   r%   r"   r:   r   r   rA   r+   r   )r'   r   r   r   rN   rO   Zf_textr   r,   Zarg_typsZ
slice_typeZ_globalsr   rT   rW   Z	new_indexr   r   r   r     s2    
 

  
z StencilPass._add_offset_to_sliceN)__name__
__module____qualname__r(   r`   rh   rQ   r   r   r   r   r   r   r   r   r   r       s   
<  o" Dr   c                 C   s  ddl m} ddlm}	 ddlm}
 ddlm} | j	 }t	
|j}||_t|j}d|krhtdddlm}	 |	j}|	|| t||||}tjd|j ||jj|jj|jj|jjd	\|j_|j_|j_}|
j|jj|jj|jjd
d	|jj|jjtjd W 5 Q R X t |t! }t"|# }t$|# }tj%&| tj'dkrft(d t)| i }|jj* D ].\}}t+,|t-||}|||< |||j.< qvt/|| tj'dkrt(d t)| |jj* D ]\}}|||< qi }|0 D ]}|j1D ]t}t2|t+j3rt2|j4t+j5rtj'dkrTt(d||j4j6|j4j.|j4j6|k ||j4j6 j.||j4j.< ||j4j6 |_4qqtj'dkrt(d| t(d t)| t7| ||_|| 8|d |fS )z'get typed IR from stencil bytecode
    r   )
CPUContext)
cpu_target)type_annotations)type_inference_stager5   z6Cannot use the reserved word 'out' in stencil kernels.zbefore-inferenceNr   )r    r!   r"   ZliftedZlifted_fromr,   r   Zhtml_outputr7   zInitial stencil_blockszAfter replace_varsrX   r^   zAfter replace arg with arr)9Znumba.core.cpur   Znumba.core.registryr   Znumba.core.annotationsr   Znumba.core.typed_passesr   Z	kernel_ircopydeepcopyr:   r   r   rK   Ztarget_contextZnested_contextDummyPipeliner   Zrewrite_registryapplystater$   r%   r    r,   r!   r   r"   ZTypeAnnotationr   ZHTMLZadd_offset_to_labelsZ
next_labelr   r   r   Z_the_max_labelupdater   r   r   r;   r   rt   r   r2   Zreplace_varsvaluesrA   r<   rB   r+   ZArgr   Zremove_delsZget_return_type)r[   r$   r,   rN   rO   rX   r!   r"   r   r   r   r   Zstencil_func_irr   r   r%   tprT   Z	min_labelZ	max_labelZvar_dictr   typZnew_varr*   Zcall_typr^   rW   r0   r   r   r   rM   	  s    
   


 



rM   c                   @   s   e Zd Zdd ZdS )r   c                 C   sP   ddl m} | | _|| j_|| j_|| j_|| j_d | j_d | j_d | j_	d S )Nr   )	StateDict)
Znumba.core.compilerr   r   r$   r%   r,   r    r!   r   r"   )r'   r$   r%   r,   r   r   r   r   r   r(   b  s    zDummyPipeline.__init__N)r   r   r   r(   r   r   r   r   r   a  s   r   c                 C   s   t t| ||}|dk	r|S |S )z
    infer index_var as constant if it is of a expression form like c-1 where c
    is a constant in the outer function.
    index_var is assumed to be inside stencil kernel
    N)r   _get_const_index_expr_inner)r\   r    r   	const_valr   r   r   r   n  s       r   c                 C   sr   t t|tj tt| ||}|dk	r*|S t| |}tt| ||}|dk	rP|S tt	| ||}|dk	rj|S t
dS )zWinner constant inference function that calls constant, unary and binary
    cases.
    N)r   r<   r   rt   r   _get_const_two_irsr   Zget_definition_get_const_unary_expr_get_const_binary_exprr   )r\   r    r   	var_const	index_defr   r   r   r   z  s,          r   c                 C   s8   t t| |}|dk	r|S t t||}|dk	r0|S tdS )zWget constant in either of two IRs if available
    otherwise, throw GuardException
    N)r   r   r   )Zir1Zir2varr   r   r   r   r     s    r   c                 C   sF   t t|tjo|jdk |j}t| ||}t|j }t	d
||S )zQevaluate constant unary expr if possible
    otherwise, raise GuardException
    Zunaryz{}{})r   r<   r   rC   rD   r+   r   r   fnevalr   )r\   r    r   Z	inner_varr   rD   r   r   r   r     s
    
r   c                 C   sR   t t|tjo|jdk t| ||j}t| ||j}t|j	 }t
d|||S )zRevaluate constant binary expr if possible
    otherwise, raise GuardException
    r   z{}{}{})r   r<   r   rC   rD   r   lhsrhsr   r   r   r   )r\   r    r   Zarg1Zarg2rD   r   r   r   r     s
    
r   ).r   r   r   Zpytypesr   r   Znumpyrk   Znumba.parfors.parforr9   Z
numba.corer   r   r   r   Znumba.core.typing.templatesr   r	   Znumba.core.typingr
   r   r   Znumba.core.ir_utilsr   r   r   r   r   r   r   r   r   Znumba.core.errorsr   Znumba.core.utilsr   r   objectr   rM   r   r   r   r   r   r   r   r   r   r   <module>   s6   ,     nX