
    ihf                        d Z ddlZddlZddlZddlmZ ddlmZm	Z	m
Z
mZmZ ddlZddlmZ ddlmZ ddlmZ ddlmZmZmZmZ ddlmZ dd	lmZ dd
lm Z  ddl!m"Z"m#Z# ejH                  jK                  d      Z&ejH                  jK                  d      Z'ejH                  jK                  d      Z(d Z) e)       Z*d Z+ G d de jX                        Z-d Z. G d de j^                        Z0d Z1 e       Z2ejH                  jK                  d      Z3 G d de4      Z5da6d Z7da8da9d Z:d Z;d Z<d Z=d Z> e>       Z? e"e?      d         Z@d! ZA e"eA      d"        ZBd# ZC e"eC      d$        ZDe#d%        ZEd& ZF e"eF      d'        ZGe#d(        ZHd)ej                  v ZJ eKej                  j                  d)d            ZMeJr	eMr e<        d* ZNd+ ZO e"eN      d,        ZP e"eO      d-        ZQy).a  
This file implements the code-generator for parallel-vectorize.

ParallelUFunc is the platform independent base class for generating
the thread dispatcher.  This thread dispatcher launches threads
that execute the generated function of UFuncCore.
UFuncCore is subclassed to specialize for the input/output types.
The actual workload is invoked inside the function generated by UFuncCore.
UFuncCore also defines a work-stealing mechanism that allows idle threads
to steal works from other threads.
    N)RLock)	CFUNCTYPEc_intCDLLPOINTERc_uint)ir)as_dtype)typescgutilsconfigerrors)	signature)_wrapper_info)ufuncbuilder)overload	intrinsicdarwinlinuxwin32c                  F    t         j                  } | dk  rt        d      | S )z*
    Gets the available thread count.
       z(Number of threads specified must be > 0.)r   NUMBA_NUM_THREADS
ValueError)ts    U/var/www/html/dev/engine/venv/lib/python3.12/site-packages/numba/np/ufunc/parallel.pyget_thread_countr   $   s'     	  A1uCDDH    c           
      $  !" t        |t              sJ t        j                  d      }t        j                  |      "t        j                  "      }|j                  t        j                        }t        j                  |      }t        j                  t        j                         t        j                  "      t        j                  |      t        j                  |      "g      }	|j                         j                  d      }
|
j                  d      }dj                  t        |j                        |j                         }t        j"                  ||	|      }|j%                  d      }t        j&                  |      !|j(                  \  }}}}|j+                  !      }|j-                         }|j/                         }!"fd}t1        |j(                        }t        |j2                  t        j4                        s|dz  }t        j                  t        j                         "gd	z  |gd
z  z         }t7        j8                  ||d      }t        j                  t        j                         |||"g      }t7        j8                  |||j                         }|
j;                  |j<                         t7        j8                  !j>                  t        j                  t        j                  t        j                  j@                        g       d      }!jC                  |g       }!jE                  |"      }||||fD cg c]
  } ||       } }!jC                  ||g| z   ||fD cg c]
  } ||       c}z   |gz          |jG                  |       |jI                  |       !jK                          |
jM                  |       |
j;                  |        tO        |
|j                   |j                        S c c}w c c}w )a   Wrap the original CPU ufunc/gufunc with a parallel dispatcher.
    This function will wrap gufuncs and ufuncs something like.

    Args
    ----
    ctx
        numba's codegen context

    info: (library, env, name)
        inner function info

    sig
        type signature of the gufunc

    inner_ndim
        inner dimension of the gufunc (this is len(sig.args) in the case of a
        ufunc)

    Returns
    -------
    wrapper_info : (library, env, name)
        The info for the gufunc wrapper.

    Details
    -------

    The kernel signature looks like this:

    void kernel(char **args, npy_intp *dimensions, npy_intp* steps, void* data)

    args - the input arrays + output arrays
    dimensions - the dimensions of the arrays
    steps - the step size for the array (this is like sizeof(type))
    data - any additional data

    The parallel backend then stages multiple calls to this kernel concurrently
    across a number of threads. Practically, for each item of work, the backend
    duplicates `dimensions` and adjusts the first entry to reflect the size of
    the item of work, it also forms up an array of pointers into the args for
    offsets to read/write from/to with respect to its position in the items of
    work. This allows the same kernel to be used for each item of work, with
    simply adjusted reads/writes/domain sizes and is safe by virtue of the
    domain partitioning.

    NOTE: The execution backend is passed the requested thread count, but it can
    choose to ignore it (TBB)!
       parallelgufuncwrapperzparallel.gufunc.wrapperz.kernel.{}_{})name c                 (    j                  |       S N)bitcast)argbuilder
byte_ptr_ts    r   as_void_ptrz(build_gufunc_kernel.<locals>.as_void_ptr   s    sJ//r   r         numba_parallel_forget_num_threads)libraryr"   env)(
isinstancetupler	   IntTypePointerTypeget_value_typer   intpFunctionTypeVoidTypecodegencreate_librarycreate_ir_moduleformatidr0   r"   Functionappend_basic_block	IRBuilderargsget_python_api
gil_ensuresave_threadlenreturn_typeNoneTyper   get_or_insert_functionadd_linking_libraryr/   modulebitwidthcallr&   restore_threadgil_releaseret_voidadd_ir_moduler   )#r/   ctxinfosig
inner_ndimbyte_tbyte_ptr_ptr_tintp_t
intp_ptr_tfnty
wrapperlibmodkernel_namelfuncbb_entryrA   
dimensionsstepsdatapyapi	gil_statethread_stater*   array_countparallel_for_typarallel_forinnerfunc_fntytmp_voidptrr.   num_threadsfnptrx	innerargsr(   r)   s#                                    @@r   build_gufunc_kernelrn   1   sQ   ` dE"""ZZ]F'J^^J/N

+F'J??2;;=2>>*+E+->>&+A+->>&+A+5+7 8D --.EFJ

%
%&?
@C!((DHHtyyAKKKT4E''+H ll8$G$)JJ!D*eT
 w'E  "I$$&L0 chh-Kcoou~~6qoobkkm'1lQ&6&a&GIO11#2FHL __
	Z<N 00n15=K""4<<044


5::#6#67<O
 ,,3K OOK4E:ud35AQ 5I 5LLw2&0+%>?&)? @CN- P Q 
&	i S!""7+%**$((KK5 @s   P6Pc                       e Zd Zd Zy)ParallelUFuncBuilderc                    t                |j                  }|j                  }|j                  }|j                  j
                  }t        |||||      }|j                  j                  |j                        }|j                  D 	cg c]+  }	t        j                  |	j                        j                  - }
}	|
j                  t        j                  |j                  j                        j                         d}|
||fS c c}	w )N )_launch_threadstarget_contextr   r/   fndescllvm_func_namebuild_ufunc_wrapperget_pointer_to_functionr"   rA   npdtypenumappendrF   )selfcresrS   rQ   r   r/   fnamerR   ptra	dtypenums	keepalives               r   buildzParallelUFuncBuilder.build   s     !!NN	,,**"7C	4Hll22499=3<>>BaRXXaff%))B	B)"7"7"<"<=AAB	#y(( Cs   0DN)__name__
__module____qualname__r   rr   r   r   rp   rp      s    )r   rp   c           	          t        j                  | |||d|      }t        | |||t        |j                              }|S )NF)objmoder~   )r   rw   rn   rE   rA   )r/   rQ   r   r   r~   	innerfuncrR   s          r   rw   rw      sE    00#u1:E6:<I wY	"9>>24DKr   c                   .     e Zd Zddi df fd	Zd Z xZS )ParallelGUFuncBuilderNFrr   c                 p    |j                  t        d             t        t        |   	 ||||||       y )NT)nopython)py_funcr   identitycachetargetoptionswritable_args)updatedictsuperr   __init__)r}   r   r   r   r   r   r   	__class__s          r   r   zParallelGUFuncBuilder.__init__   sE     	T401!	''  )r   c                    t                t        | j                  || j                  | j                  | j
                  d      }|j                  j                  |j                        }|j                  }g }|j                  j                  D ]O  }t        |t        j                        r|j                  }n|}|j!                  t#        |      j$                         Q |||fS )zJ
        Returns (dtype numbers, function ptr, EnvironmentObject)
        Fr   
is_parfors)rs   build_gufunc_wrapperr   sinsoutr   r/   rx   r"   r0   r   rA   r1   r   Arrayrz   r|   r
   r{   )r}   r~   rR   r   r0   r   r   tys           r   r   zParallelGUFuncBuilder.build   s     	 $LL$$))4::
 ll22499=hh 	$$ 	/A!U[[)WWXb\--.	/ #s""r   )r   r   r   r   r   __classcell__)r   s   @r   r   r      s    48!)#r   r   c                    |j                   }|j                  }|j                  }t        j                  | |||||      }	t        d |D              }
t        d |D              }t        |
|z        }t        |||	||      }|S )zBuild gufunc wrapper for the given arguments.
    The *is_parfors* is a boolean indicating whether the gufunc is being
    built for use as a ParFors kernel. This changes codegen and caching
    behavior.
    r   c              3   .   K   | ]  }|D ]  }|   y wr%   rr   .0termsyms      r   	<genexpr>z'build_gufunc_wrapper.<locals>.<genexpr>  s     5555   c              3   .   K   | ]  }|D ]  }|   y wr%   rr   r   s      r   r   z'build_gufunc_wrapper.<locals>.<genexpr>  s     7$$73#7#7r   )r/   rt   r   r   r   setrE   rn   )r   r~   r   r   r   r   r/   rQ   r   	innerinfosym_insym_outrT   rR   s                 r   r   r      s     llG


CI11sD*I 555F7$77GVg%&JiJD Kr   c                       e Zd ZdZd Zd Zy)_nopzA no-op contextmanager
    c                      y r%   rr   )r}   s    r   	__enter__z_nop.__enter__       r   c                      y r%   rr   )r}   rA   s     r   __exit__z_nop.__exit__#  r   r   N)r   r   r   __doc__r   r   rr   r   r   r   r     s    r   r   c                  n   	 t         5  dd l} d| j                         v st        r!| j	                         }|j                         an
t               ad d d        y # 1 sw Y   y xY w# t        $ rF}d}t        j                  |t        |      z  t        j                         t               aY d }~y d }~ww xY w)Nr   forkaA  Could not obtain multiprocessing lock due to OS level error: %s
A likely cause of this problem is '/dev/shm' is missing or read-only such that necessary semaphores cannot be written.
*** The responsibility of ensuring multiprocessing safe access to this initialization sequence/module import is deferred to the user! ***
)_backend_init_thread_lockmultiprocessingget_start_method_windowsget_contextr   _backend_init_process_lockr   OSErrorwarningswarnstrr   NumbaSystemWarning)r   rQ   emsgs       r   _set_init_process_lockr   *  s    ,
 ' 	4"99;;x%113-0YY[*-1V*	4 	4 	4  , 	 	cCFlF$=$=>%)V",s5   A% AAA% A"A% "A% %	B4.<B//B4Fc                  0    t         t        d      t         S )zM
    Get the name of the threading layer in use for parallel CPU targets
    z#Threading layer is not initialized.)_threading_layerr   rr   r   r   threading_layerr   O  s     >??r   c                     	 t         rd} nt        rd} nt        rd} nt        d      t	        |       }|j
                  }g |_        t        |_         |       }|dk  r=d|z  }t        j                  |      }t        j                  |       t        d|z        y# t        t        f$ r}t        d|z        d}~ww xY w)	zF
    Checks that if TBB is present it is of a compatible version.
    z	tbb12.dllzlibtbb.12.dylibzlibtbb.so.12zUnknown operating systemi/  zThe TBB threading layer requires TBB version 2021 update 6 or later i.e., TBB_INTERFACE_VERSION >= 12060. Found TBB_INTERFACE_VERSION = %s. The TBB threading layer is disabled.zProblem with TBB. Reason: %sN)_IS_WINDOWS_IS_OSX	_IS_LINUXr   r   TBB_runtime_interface_versionargtypesr   restyper   NumbaWarningr   r   ImportErrorr   )libtbb_namelibtbbversion_functbb_iface_verr   problemr   s          r   _check_tbb_version_compatibler   Y  s    >%K+K(K788k";; "$$5 2 6C	CC
 ))#.GMM'"<sBCC !   > 81<==>s   BB B=*B88B=c                    
 t         s
t                t         5  t        5  t        r	 d d d        d d d        y d fd} t	        t
        j                        j                         }t
        j                  }t        |      dk(  rt        |      h dk(  st        d|z        d }t               
d
d<   d
d	<   g }
fd
}||v r@ |      }|s3|dk(  r|j                  d       n|dk(  rt        r|j                  d	       |}n|dv rdg}|j                  d       |dk(  rn|dk(  r)t        r|j                  d	       |j                  d       nU|dk(  r@t        s|j                  d       t        r|j                  d	       |j                  d       nd}t        ||z         | |      \  }}nK|dk(  r6 | |      \  }}|s9|j                  d       t        r"|j                  d	       nd}t        ||z        |s ||       t!        j"                  d|j$                         t!        j"                  d|j&                         t!        j"                  d|j(                         t!        j"                  d|j*                         t!        j"                  d|j,                          t/        d t0              |j2                        }	 |	t4               t7        |       |adad d d        d d d        y # 1 sw Y   xY w# 1 sw Y   y xY w)Nc                    d}| j                  d      r	 t                ddlm} |S | j                  d      r		 ddlm} |S | j                  d      rddlm} |S d	}t        || z        # t        $ r Y |S w xY w# t        $ r Y |S w xY w)
zZ
                Loads a specific threading layer backend based on string
                Ntbbr   )tbbpoolomp)omppool	workqueue)r   z/Unknown value specified for threading layer: %s)
startswithr   numba.np.ufuncr   r   r   r   r   )backendlibr   s      r   select_known_backendz-_launch_threads.<locals>.select_known_backend  s     %%e,57A 
 ''.A 
 ''4? 
 LC$S7]33 '  
 '  
s"   A* A: *	A76A7:	BBc                 @    d}| D ]  } |      }| ||fS  d}||fS )z_
                Selects from presented backends and returns the first working
                Nr#   rr   )backendsr   r   r   s      r   select_from_backendsz-_launch_threads.<locals>.select_from_backends  sH     ' !G.w7C G|#!
 !GG|#r   r,   >   r   r   r   z]THREADING_LAYER_PRIORITY invalid: %s. It must be a permutation of {'tbb', 'omp', 'workqueue'}z3Intel TBB is required, try:
$ conda/pip install tbbTBBz?Intel OpenMP is required, try:
$ conda/pip install intel-openmpOSX_OMPc                     d}d}t        |       dk(  rd}t        |       dk(  r|| d      z  }t        |       dkD  r*dj                  | D cg c]  }|   	 c}      }|d|z  z  }t        |z        c c}w )Nz&No threading layer could be loaded.
%szHINT:
%sr   r#   r   z
OR
z
One of:
%s)rE   joinr   )requirederrmsghintmsghintrl   optionserr_helperss         r   raise_with_hintz(_launch_threads.<locals>.raise_with_hint  s    B%x=A%Dx=A%"[!%==Dx=1$&mmX,N[^,NOG"mg&=>D $// -Os   A5r   r   )
threadsafeforksafesafer   r   r   r   z+No threading layer available for purpose %sdefaultz7The threading layer requested '%s' is unknown to Numba.r-   do_scheduling_signeddo_scheduling_unsignedallocate_scheddeallocate_schedT)r   r   r   _is_initializedr   r   THREADING_LAYERlowerTHREADING_LAYER_PRIORITYrE   r   r   r   r|   r   r   ll
add_symbolrg   r   r   r   r   r   r   launch_threadsNUM_THREADS_load_threading_functionsr   )r   r   namedbackendsr   requirementsr   libname	availabler   r  r   r   s             @@r   rs   rs   {  s   % 	# R#& Q	#Q	#R# R#6$ F**+113A";;M&!+&*EE 2 $$  C&K#<K'IK	"L
0 M!*1- Ez$++E2e$++I688"G	##E*;,&$++I6$$U+*_ %!((/$++I6$$[1GC$S1W--3I>Wi  4MBW ''.$++I6O q)) -MM.0@0@AMM0#2J2JKMM2C4N4NOMM*C,>,>?MM,c.B.BC3YtU3C4F4FGN;'%c*  '"OcQ	#R# R#Q	# Q	#R# R#s-   K?K3K?J)K3"K?3K<	8K??Lc           
      n   t        j                  d| j                         t        j                  d| j                         t        j                  d| j                          t        d t              | j                        at        t                t        t              | j                        a	 t        t              | j                        a
t        j                  d| j                         t        j                  d| j                         t        j                  d| j                          t        t        t              | j                        a t        t              | j                        a t        t        t        t        t#        t              t#        t                    | j                        ay )Nr.   set_num_threadsget_thread_idset_parallel_chunksizeget_parallel_chunksizeget_sched_size)r   r   r.   r	  r
  r   r   _set_num_threadsr  _get_num_threads_get_thread_idr  r  r  r   _set_parallel_chunksize_get_parallel_chunksizer   _get_sched_size)r   s    r   r  r    sH   MM#S%8%89MM#S%8%89MM/3#4#45 .yu-c.A.AB[! (y'(;(;< &Yu%c&7&78NMM*C,F,FGMM*C,F,FGMM"C$6$670i(.0030J0JL 0i/0J0JK0i & & ' '	0 140B0B	DOr   c                  ,    ddl m dz  fd} | S )Nr   )r   z.The number of threads must be between 1 and %sc                 0    | kD  s| dk  rt              y )Nr   )r   )nr   r   s    r   	snt_checkz gen_snt_check.<locals>.snt_check:  s!      AES/! %*r   )numba.core.configr   )r  r   r   s    @@r   gen_snt_checkr  6  s    3
:=N
NC" r   c                     t         S r%   )r  r  s    r   ol_snt_checkr  C  s    r   c                     t                t        | t        t        j                  f      st        d      t        |        t        |        y)a  
    Set the number of threads to use for parallel execution.

    By default, all :obj:`numba.config.NUMBA_NUM_THREADS` threads are used.

    This functionality works by masking out threads that are not used.
    Therefore, the number of threads *n* must be less than or equal to
    :obj:`~.NUMBA_NUM_THREADS`, the total number of threads that are launched.
    See its documentation for more details.

    This function can be used inside of a jitted function.

    Parameters
    ----------
    n: The number of threads. Must be between 1 and NUMBA_NUM_THREADS.

    See Also
    --------
    get_num_threads, numba.config.NUMBA_NUM_THREADS,
    numba.config.NUMBA_DEFAULT_NUM_THREADS, :envvar:`NUMBA_NUM_THREADS`

    2The number of threads specified must be an integerN)rs   r1   intry   integer	TypeErrorr  r  r  s    r   r	  r	  H  s8    . a#rzz*+LMMaLQr   c                     t                t        | t        j                        sd}t	        j
                  |      d }|S )Nr  c                 0    t        |        t        |        y r%   )r  r  r  s    r   implz ol_set_num_threads.<locals>.implm  s    !r   rs   r1   r   Integerr   TypingErrorr  r   r$  s      r   ol_set_num_threadsr)  f  s8    a'B  %% Kr   c                  l    t                t               } | dk  rt        dt               d| d      | S )aM  
    Get the number of threads used for parallel execution.

    By default (if :func:`~.set_num_threads` is never called), all
    :obj:`numba.config.NUMBA_NUM_THREADS` threads are used.

    This number is less than or equal to the total number of threads that are
    launched, :obj:`numba.config.NUMBA_NUM_THREADS`.

    This function can be used inside of a jitted function.

    Returns
    -------
    The number of threads.

    See Also
    --------
    set_num_threads, numba.config.NUMBA_NUM_THREADS,
    numba.config.NUMBA_DEFAULT_NUM_THREADS, :envvar:`NUMBA_NUM_THREADS`

    r   zLInvalid number of threads. This likely indicates a bug in Numba. (thread_id=z, num_threads=))rs   r  RuntimeErrorr
  rj   s    r   r.   r.   s  s=    , "$Ka *O[: ; 	; r   c                       t                d } | S )Nc                  z    t               } | dk  r+t        dt                      t        d|        t        d      | S )Nr   zBroken thread_id: znum_threads: z@Invalid number of threads. This likely indicates a bug in Numba.)r  printr
  r,  r-  s    r   r$  z ol_get_num_threads.<locals>.impl  sD    &(!&8/;/  G H Hr   rs   r$  s    r   ol_get_num_threadsr3    s     Kr   c                 R    t                d }t        t        j                        |fS )Nc                     |j                   }t        j                  t        j                  g       }t        j
                  ||d      }|j                  |g       S )Nr.   rJ   r	   r7   r   rW   rH   rL   contextr(   r   rA   r[   rY   fns          r   r9   z"_iget_num_threads.<locals>.codegen  sE    nnw~~r2++C7HI||B##r   )rs   r   r   r6   	typingctxr9   s     r   _iget_num_threadsr<    s#    $
 UZZ '))r   c                  *    t                t               S )zv
    Returns a unique ID for each thread in the range 0 (inclusive)
    to :func:`~.get_num_threads` (exclusive).
    )rs   r  rr   r   r   r
  r
    s     r   c                       t                d } | S )Nc                      t               S r%   )_iget_thread_idrr   r   r   r$  zol_get_thread_id.<locals>.impl  s      r   r1  r2  s    r   ol_get_thread_idrA    s    !Kr   c                 >    d }t        t        j                        |fS )Nc                     |j                   }t        j                  t        j                  g       }t        j
                  ||d      }|j                  |g       S )Nr
  r6  r7  s          r   r9   z _iget_thread_id.<locals>.codegen  sD    nnw~~r2++CG||B##r   )r   r   r6   r:  s     r   r@  r@    s    $
 UZZ '))r   NUMBA_DYLD_WORKAROUNDc                     t                t        | t        t        j                  f      st        d      | dk  rt        d      t        |       S )N)The parallel chunksize must be an integerr   /chunksize must be greater than or equal to zero)rs   r1   r  ry   r   r!  r   r  r  s    r   r  r    sE    a#rzz*+CDD1uJKK"1%%r   c                  *    t                t               S r%   )rs   r  rr   r   r   r  r    s    "$$r   c                     t                t        | t        j                        sd}t	        j
                  |      d }|S )NrF  c                 8    | dk  rt        d      t        |       S )Nr   rG  )r   r  r  s    r   r$  z'ol_set_parallel_chunksize.<locals>.impl  s     q5NOO&q))r   r%  r(  s      r   ol_set_parallel_chunksizerK    s8    a'9  %%* Kr   c                       t                d } | S )Nc                      t               S r%   )r  rr   r   r   r$  z'ol_get_parallel_chunksize.<locals>.impl  s    &((r   r1  r2  s    r   ol_get_parallel_chunksizerN    s    )Kr   )Rr   ossysr   	threadingr   threadRLockctypesr   r   r   r   r   numpyry   llvmlite.bindingbindingr   llvmliter	   numba.np.numpy_supportr
   
numba.corer   r   r   r   numba.core.typingr   numba.np.ufunc.wrappersr   r   r   numba.extendingr   r   platformr   r   r   r   r   r  rn   UFuncBuilderrp   rw   GUFuncBuilderr   r   r   r   objectr   r   r   r   r   r   r   rs   r  r  r  r  r	  r)  r.   r3  r<  r
  rA  r@  environ_DYLD_WORKAROUND_SETr  get_DYLD_WORKAROUND_VALr  r  rK  rN  rr   r   r   <module>re     s=  
 
 
  * : :    + 5 5 ' 1 ' /
,,
!
!(
+LL##G,	ll%%g.  LH)<44 )&&#L66 &#X0 (M <<""7+6  " ,>    >DV#rDD O	 
) < 
/	 	@ 
/  * *
 
-  * * /"**< 2::>>*A1EF 0&% 

 !
 "
 

 ! "r   