
    /jT                        U d Z ddlZddlZddlmZ ddlmZ ddlmZm	Z	m
Z
 ddlZddlZddlmZmZ ddlmZ dd	lmZ dd
lmZmZmZmZmZ ddlmZmZ da ej                    Z ej                     Z!g a"e#e$eg df         e#e%         f                  e&d<    e'ej(        dd           Z) e            a*dZ+e$ej(        j,                 e&d<   de-fdZ. e.            r%ej(        j/        Z/ej(        j0        Z1ej(        j2        Z3n ed          Z/de4de4fdZ1de4de4fdZ3 ed          de4fd            Z5de-fdZ6dFde-de-fdZ7de-fdZ8d Z9dGd Z:dGd!Z;dGd"Z< G d# d$          Z= G d% d          Z> G d& d'e>          Z?deddfd(Z@dHdede%fd)ZA ed          dHdedeBe%ef         fd*            ZC	 dHdede/fd+ZDde4fd,ZEde4e%z  ej>        z  dej>        fd-ZFded.ede-fd/ZG G d0 d1          ZHd2e
d3         deHfd4ZIdGd5ZJd2eddfd6ZKdHdedefd7ZLdHd8e4dedefd9ZMdHdeddfd:ZNde#e%         fd;ZOde%fd<ZPdej>        dej(        j,        fd=ZQ	 dId?e4de4e%z  ej>        z  ddfd@ZRdIde4e%z  ej>        z  de4fdAZSddBlTmUZUmVZVmWZWmXZXmYZYmZZZm[Z[m\Z\m]Z]m^Z^m_Z_m`Z`maZambZbmcZcmdZdmeZe ddClfmgZgmhZhmiZimjZjmkZkmlZlmmZmmnZnmoZo  e	dDe$e4e4f                   Zpg dEZqdS )Jz
This package introduces support for the XPU backend, specifically tailored for
Intel GPU optimization.

This package is lazily initialized, so you can always import it, and use
:func:`is_available()` to determine if your system supports XPU.
    N)Callable)	lru_cache)AnyNewTypeOptional)_dummy_type_LazySeedTracker)Device   )_get_device_index)graphgraph_pool_handleis_current_stream_capturingmake_graphed_callablesXPUGraph)EventStreamF_queued_calls_xpu_isInBadForkc                      dS NF r       W/home/longshao/multi-rider-rag/.venv/lib/python3.11/site-packages/torch/xpu/__init__.py<lambda>r   &   s     r   r   default_generatorsreturnc                  $    t           j        j        S )z(Return true if compile with XPU support.)torch_C_has_xpur   r   r   _is_compiledr"   +   s    8r   _XpuDevicePropertiesdevicec                      t          d          Nz(PyTorch was compiled without XPU supportNotImplementedErrorr$   s    r   _exchange_devicer*   8       !"LMMMr   c                      t          d          r&   r'   r)   s    r   _maybe_exchange_devicer-   ;   r+   r   )maxsizec                  ^    t                      sdS t          j                                        S )z*Return the number of XPU device available.r   )r"   r   r    _xpu_getDeviceCountr   r   r   device_countr1   ?   s)     >> q8'')))r   c                  &    t                      dk    S )z7Return a bool indicating if XPU is currently available.r   )r1   r   r   r   is_availabler3   G   s     >>Ar   Tincluding_emulationc                 l    t                      sdS | p"t          j                                        j        S )zKReturn a bool indicating if the current XPU device supports dtype bfloat16.F)r3   r   xpuget_device_propertieshas_bfloat16_conversions)r4   s    r   is_bf16_supportedr9   M   s5    >> u 	F9**,,Er   c                  h    t                      sdS t          j                                        j        S )zGReturn a bool indicating if the current XPU device supports dtype tf32.F)r3   r   r6   r7   'has_subgroup_matrix_multiply_accumulater   r   r   is_tf32_supportedr<   W   s,    >> u
 9**,,TTr   c                  .    t           ot                       S )z8Return whether PyTorch's XPU state has been initialized.)_initialized_is_in_bad_forkr   r   r   is_initializedr@   b   s    1 1 111r   c                    t                      r |              d S |                    dd          r.t                              | t	          j                               d S |                    dd          r.t                              | t	          j                               d S t                              | t	          j                    f           d S )Nseed_allFseed)	r@   get_lazy_seed_trackerqueue_seed_all	tracebackformat_stack
queue_seedr   append)callablekwargss     r   
_lazy_callrM   g   s     
G




 ::j%(( 	G--h	8N8P8PQQQQQZZ&& 	G))(I4J4L4LMMMMM   (I,B,D,D!EFFFFFr   c                  "    t                       dS )zInitialize PyTorch's XPU state.
    This is a Python API about lazy initialization that avoids initializing
    XPU until the first time it is accessed. Does nothing if the XPU state is
    already initialized.
    N)
_lazy_initr   r   r   initrP   u   s     LLLLLr   c            	      2   t                      st          t          d          rd S t          5  t                      r	 d d d            d S t	                      rt          d          t                      st          d          t          j	        
                                 dt          _        t                              d t                                          D                        	 t          D ]Z\  } }	  |              # t           $ r=}dt#          |           dd                    |           }t!          |          |d }~ww xY w	 t'          t          d           n# t'          t          d           w xY wdad d d            d S # 1 swxY w Y   d S )	Nis_initializingzuCannot re-initialize XPU in forked subprocess. To use XPU with multiprocessing, you must use the 'spawn' start methodz#Torch not compiled with XPU enabledTc              3      K   | ]}||V  	d S Nr   ).0callss     r   	<genexpr>z_lazy_init.<locals>.<genexpr>   s(      XXuRWXUXXXXXXr   z5XPU call failed lazily at initialization with error: z'

XPU call was originally invoked at:

 )r@   hasattr_tls_initialization_lockr?   RuntimeErrorr"   AssertionErrorr   r    	_xpu_initrR   r   extendrE   	get_calls	Exceptionstrjoindelattrr>   )queued_callorig_tracebackemsgs       r   rO   rO   ~   s0    74):;; 	 ! !  		! ! ! ! ! ! ! !  	I   ~~ 	H !FGGG  $XX0B0L0L0N0NXXXXXX	-/< 0 0+^0KMMMM  0 0 0\PSTUPVPV \ \BD''.BYBY\ \  $C..a/00 D+,,,,GD+,,,,C! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! ! !sT   F
BF*E#7
DE#
E	8EE		E#F#E::FFFc                   8    e Zd ZdeddfdZd Zdededefd	ZdS )
_DeviceGuardindexr   Nc                 "    || _         d| _        d S N)idxprev_idx)selfrk   s     r   __init__z_DeviceGuard.__init__   s    r   c                 X    t           j                            | j                  | _        d S rT   r   r6   r*   ro   rp   rq   s    r   	__enter__z_DeviceGuard.__enter__       	2248<<r   typevaluerG   c                 X    t           j                            | j                  | _        dS r   r   r6   r-   rp   ro   rq   rx   ry   rG   s       r   __exit__z_DeviceGuard.__exit__        933DMBBur   )__name__
__module____qualname__intrr   rv   r   r}   r   r   r   rj   rj      sn        c d    = = =S        r   rj   c                   <    e Zd ZdZd eddfdZd Zdededefd	ZdS )
r$   zContext-manager that changes the selected device.

    Args:
        device (torch.device or int or str): device index to select. It's a no-op if
            this argument is a negative integer or ``None``.
    r   Nc                 @    t          |d          | _        d| _        d S )NToptionalrn   )r   ro   rp   )rq   r$   s     r   rr   zdevice.__init__   s!    $Vd;;;r   c                 X    t           j                            | j                  | _        d S rT   rt   ru   s    r   rv   zdevice.__enter__   rw   r   rx   ry   rG   c                 X    t           j                            | j                  | _        dS r   r{   r|   s       r   r}   zdevice.__exit__   r~   r   )r   r   r   __doc__r   rr   rv   r}   r   r   r   r$   r$      sx         s t    = = =S        r   c                   $     e Zd ZdZd fdZ xZS )	device_ofa  Context-manager that changes the current device to that of given object.

    You can use both tensors and storages as arguments. If a given object is
    not allocated on a XPU, this is a no-op.

    Args:
        obj (Tensor or Storage): object allocated on the selected device.
    r   Nc                     |j         r|                                nd}t                                          |           d S rm   )is_xpu
get_devicesuperrr   )rq   objro   	__class__s      r   rr   zdevice_of.__init__   s<    "%*4cnn"r   r   N)r   r   r   r   rr   __classcell__)r   s   @r   r   r      sG                  r   r   c                     t                       t          |           } | dk    r!t          j                            |            dS dS )zSet the current device.

    Args:
        device (torch.device or int or str): selected device. This function is a
            no-op if this argument is negative.
    r   N)rO   r   r   r    _xpu_setDevicer)   s    r   
set_devicer      sF     LLLv&&F{{''''' {r   c                 *    t          |           j        S )a  Get the name of a device.

    Args:
        device (torch.device or int or str, optional): device for which to
            return the name. This function is a no-op if this argument is a
            negative integer. It uses the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).

    Returns:
        str: the name of the device
    )r7   namer)   s    r   get_device_namer      s     !((--r   c                     t          |           t          t          t          t          t          d          t          t          t          ffdt                    D             S )a  Get the xpu capability of a device.

    Args:
        device (torch.device or int or str, optional): device for which to
            return the device capability. This function is a no-op if this
            argument is a negative integer. It uses the current device, given by
            :func:`~torch.xpu.current_device`, if :attr:`device` is ``None``
            (default).

    Returns:
        dict[str, Any]: the xpu capability dictionary of the device
    Nc                     i | ]:}|                     d           t          t          |          x          7|;S )__)
startswith
isinstancegetattr)rU   keypropsserializable_typesry   s     r   
<dictcomp>z)get_device_capability.<locals>.<dictcomp>  sa       ~~d## !4!447IJJ	U  r   )
r7   r   floatboolrb   rx   listtupledictdir)r$   r   r   ry   s    @@@r   get_device_capabilityr      sl     "&))EudCdT5$O     u::   r   c                 ^    t                       t          | d          } t          |           S )a  Get the properties of a device. Returns _XpuDeviceProperties containing the following device properties:

    - ``name`` (str): device name.
    - ``platform_name`` (str): SYCL platform name.
    - ``vendor`` (str): device vendor.
    - ``device_id`` (int): device identifier (product ID).
    - ``driver_version`` (str): driver version.
    - ``version`` (str): runtime version.
    - ``max_compute_units`` (int): number of parallel compute units.
    - ``gpu_eu_count`` (int): number of EUs (Execution Unit).
    - ``max_work_group_size``: (int): maximum number of work-items permitted in a work-group.
    - ``max_num_sub_groups`` (int): maximum number of sub-groups supported in a work-group.
    - ``sub_group_sizes``: (list[int]): a list of supported sub-group sizes.
    - ``local_mem_size`` (int): device local memory capacity that can be allocated per work-group in bytes.
    - ``has_fp16`` (bool): whether float16 dtype is supported.
    - ``has_fp64`` (bool): whether float64 dtype is supported.
    - ``has_atomic64`` (bool): whether 64-bit atomic operations are supported.
    - ``has_bfloat16_conversions`` (bool): whether bfloat16 conversions are supported.
    - ``has_subgroup_matrix_multiply_accumulate`` (bool): whether DPAS (Dot Product Accumulate Systolic) is supported.
    - ``has_subgroup_matrix_multiply_accumulate_tensor_float32`` (bool): whether DPAS with tf32 inputs is supported.
    - ``has_subgroup_2d_block_io`` (bool): whether 2D block I/O for efficient matrix multiplication is supported.
    - ``total_memory`` (int): device global memory in bytes.
    - ``gpu_subslice_count`` (int): number of subslice.
    - ``architecture`` (int): device architecture identifier (experimental).
    - ``type`` (str): device type, e.g. 'cpu', 'gpu', accelerator', 'host', 'unknown'.
    - ``uuid`` (Any): device UUID (Universal Unique ID), 16 bytes.

    Args:
        device (torch.device or int or str): device for which to return the
            properties of the device.

    Returns:
        _XpuDeviceProperties: the properties of the device
    Tr   )rO   r   _get_device_propertiesr)   s    r   r7   r7     s.    J LLLv555F!&)))r   c                  Z    t                       t          j                                        S )z0Return the index of a currently selected device.)rO   r   r    _xpu_getDevicer   r   r   current_devicer   5  s    LLL8""$$$r   c                     t          | t                    rt          j        |           } n*t          | t                    rt          j        d|           } | S )zReturn the torch.device type object from the passed in device.

    Args:
        device (torch.device or int or str): selected device.
    r6   )r   rb   r   r$   r   r)   s    r   _get_devicer   ;  sO     &# -f%%	FC	 	  -eV,,Mr   peerc                     t                       t          | d          } t          |d          }t          j                            | |          S )a/  Query whether a device can access a peer device's memory.

    Args:
        device (torch.device or int or str): selected device.
        peer (torch.device or int or str): peer device to query access to.

    Returns:
        bool: ``True`` if ``device`` can access ``peer``, ``False`` otherwise.
    Tr   )rO   r   r   r    _xpu_canDeviceAccessPeer)r$   r   s     r   can_device_access_peerr   H  sI     LLLv555FTD111D8,,VT:::r   c                   `    e Zd ZU dZed         ed<   ded         ddfdZd Zd	ed
edefdZ	dS )StreamContexta  Context-manager that selects a given stream.

    All XPU kernels queued within its context will be enqueued on a selected
    stream.

    Args:
        Stream (Stream): selected stream. This manager is a no-op if it's
            ``None``.
    .. note:: Streams are per-device.
    torch.xpu.Stream
cur_streamstreamr   Nc                 ^    || _         t          d d          | _        | j        	d| _        d S d S )NTrn   )r   r   ro   )rq   r   s     r   rr   zStreamContext.__init__f  s5    $T4008DHHH r   c                    | j         }|| j        dk    rd S t          j                            d           | _        | j        j        |j        k    rUt          |j                  5  t          j                            |j                  | _        d d d            n# 1 swxY w Y   t          j                            |           d S rm   )	r   ro   r   r6   current_streamsrc_prev_streamr$   dst_prev_stream
set_stream)rq   r   s     r   rv   zStreamContext.__enter__l  s    [
RF$y77== &**;;;
)** S S',y'?'?
@Q'R'R$S S S S S S S S S S S S S S S	Z(((((s   $*BB!Brx   ry   rG   c                     | j         }|| j        dk    rd S | j        j        |j        k    r$t          j                            | j                   t          j                            | j                   d S rm   )r   ro   r   r$   r   r6   r   r   )rq   rx   ry   rG   r   s        r   r}   zStreamContext.__exit__x  sl    [
RF &**;;;I  !5666	T122222r   )
r   r   r   r   r   __annotations__rr   rv   r   r}   r   r   r   r   r   X  s         	 	 +,,,,x(:;     
) 
) 
)3S 3 3 3 3 3 3 3 3r   r   r   r   c                      t          |           S )zWrap around the Context-manager StreamContext that selects a given stream.

    Arguments:
        stream (Stream): selected stream. This manager is a no-op if it's ``None``.
    )r   r   s    r   r   r     s        r   c                 J    t           j                            | ||           dS )a  set stream specified by the stream id, device index and device type

    Args: stream_id (int): not visible to the user, used to assigned to the specific stream.
          device_index (int): selected device index.
          device_type (int): selected device type.
    	stream_iddevice_indexdevice_typeN)r   r    _xpu_setStreamr   s      r   _set_stream_by_idr     s6     
H!      r   c                 l    | dS t                       t          | j        | j        | j                   dS )a  Set the current stream. This is a wrapper API to set the stream.
        Usage of this function is discouraged in favor of the ``stream``
        context manager.

    Args:
        stream (Stream): selected stream. This function is a no-op
            if this argument is ``None``.
    Nr   )rO   r   r   r   r   r   s    r   r   r     sJ     ~LLL"(&     r   c                     t                       t          j                            t	          | d                    }t          |d         |d         |d                   S )aR  Return the currently selected :class:`Stream` for a given device.

    Args:
        device (torch.device or int, optional): selected device. Returns
            the currently selected :class:`Stream` for the current device, given
            by :func:`~torch.xpu.current_device`, if :attr:`device` is ``None``
            (default).
    Tr   r   r      r   )rO   r   r    _xpu_getCurrentStreamr   r   )r$   
streamdatas     r   r   r     sa     LLL//&4000 J Q-jmTU   r   data_ptrc                     t                       t          j                            | t	          |d                    }t          |d         |d         |d                   S )a;  Return a :class:`Stream` from an external SYCL queue.

    This function is used to wrap SYCL queue created in other libraries in order
    to facilitate data exchange and multi-library interactions.

    .. note:: This function doesn't manage the queue life-cycle, it is the user
       responsibility to keep the referenced queue alive while this returned stream is
       being used. The different SYCL queue pointers will result in distinct
       :class:`Stream` objects, even if the SYCL queues they dereference are equivalent.

    Args:
        data_ptr(int): Integer representation of the `sycl::queue*` value passed externally.
        device(torch.device or int, optional): the device where the queue was originally created.
            It is the user responsibility to ensure the device is specified correctly.
    Tr   r   r   r   r   )rO   r   r    _xpu_getStreamFromExternalr   r   )r   r$   r   s      r   get_stream_from_externalr     sd      LLL44#FT::: J Q-jmTU   r   c                 ~    t                       t          | d          } t          j                            |           S )a*  Wait for all kernels in all streams on a XPU device to complete.

    Args:
        device (torch.device or int, optional): device for which to synchronize.
            It uses the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    Tr   )rO   r   r   r    _xpu_synchronizer)   s    r   synchronizer     s5     LLLv555F8$$V,,,r   c                      t                      sg S t          j                                        } | g S |                                 S )z<Return list XPU architectures this library was compiled for.)r"   r   r    _xpu_getArchFlagssplit)
arch_flagss    r   get_arch_listr     sC    >> 	++--J	r   c                      t                      } t          |           dk    rdS dd                    d | D                        S )zIReturn XPU AOT(ahead-of-time) build flags this library was compiled with.r   rX   z-device ,c              3      K   | ]}|V  d S rT   r   )rU   archs     r   rW   z$get_gencode_flags.<locals>.<genexpr>  s"      ::t::::::r   )r   lenrc   )	arch_lists    r   get_gencode_flagsr     sJ    I
9~~r<chh::	:::::<<<r   c                 ^    | j         }|t                      }t          j        j        |         S )zuReturn the XPU Generator object for the given device.

    Args:
        device (torch.device): selected device.
    )rk   r   r   r6   r   )r$   ro   s     r   _get_generatorr     s+     ,C
{9',,r   r6   offsetc                 T     t          |          d fd}t          |           dS )a$  Set the random number generator state offset of the specified GPU.

    Args:
        offset (int): The desired offset
        device (torch.device or int, optional): The device to set the RNG state.
            Default: ``'xpu'`` (i.e., ``torch.device('xpu')``, the current XPU device).
    r   Nc                  P    t                    } |                                d S rT   )r   
set_offset)default_generatorfinal_devicer   s    r   cbz!_set_rng_state_offset.<locals>.cb  s+    *<88$$V,,,,,r   r   )r   rM   )r   r$   r   r   s   `  @r   _set_rng_state_offsetr     sG     v&&L- - - - - - - rNNNNNr   c                     t                       t          |           }t          |          }|                                S )aL  Return the random number generator state offset of the specified GPU.

    Args:
        device (torch.device or int, optional): The device to return the RNG state offset of.
            Default: ``'xpu'`` (i.e., ``torch.device('xpu')``, the current XPU device).

    .. warning::
        This function eagerly initializes XPU.
    )rO   r   r   
get_offset)r$   r   r   s      r   _get_rng_state_offsetr     s:     LLLv&&L&|44'')))r   )change_current_allocatorempty_cacheget_per_process_memory_fractionmax_memory_allocatedmax_memory_reservedmem_get_infomemory_allocatedmemory_reservedmemory_snapshotmemory_statsmemory_stats_as_nested_dictMemPoolreset_accumulated_memory_statsreset_peak_memory_statsset_per_process_memory_fractionuse_mem_poolXPUPluggableAllocator)	get_rng_stateget_rng_state_allinitial_seedmanual_seedmanual_seed_allrC   rB   set_rng_stateset_rng_state_all_POOL_HANDLE)9r   r   r   r  r   r   r   r   r   r   r$   r   r1   r   r   r   r   r7   r   r   r  r  r   r   r   rP   r  r3   r9   r   r@   r<   r   r  r  r   r   r   r   r   r   r   r   r   r   r   r   rC   rB   r   r   r  r  r   r   streamsr   )Tr   rT   )r6   )rr   	threadingrG   collections.abcr   	functoolsr   typingr   r   r   r   torch._Ctorch._utilsr   r	   torch.typesr
   _utilsr   graphsr   r   r   r   r   r
  r   r   r>   localrZ   Lockr[   r   r   r   rb   r   r   r    r?   rE   r   	Generatorr   r"   r#   _xpu_exchangeDevicer*   _xpu_maybeExchangeDevicer-   r   r1   r3   r9   r<   r@   rM   rP   rO   rj   r$   r   r   r   r   r   r7   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   memoryr   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r  randomr  r  r  r  r  rC   rB   r  r  r	  __all__r   r   r   <module>r     s9             $ $ $ $ $ $       ) ) ) ) ) ) ) ) ) )   6 6 6 6 6 6 6 6       % % % % % %              # " " " " " " " y%y~''   t	(2t8
d3i
'(    '%($6FF%%'' 02 E%(,- 2 2 2d    
 <>> N 88x3"X> ';'=>>N N N N N NNs Ns N N N N 1*c * * * *d     4 4    U4 U U U U2 2 2
G G G G   % % % %P
 
 
 
 
 
 
 
       (       
(v 
($ 
( 
( 
( 
(. .F .c . . . . 4 & DcN    2 '* '*'*'* '* '* '*T% % % % %
c	EL0 
U\ 
 
 
 
;6 ; ;D ; ; ; ; (3 (3 (3 (3 (3 (3 (3 (3V!8./ !M ! ! ! !   v $    & 6 V    $ s F f    2
- 
- 
-$ 
- 
- 
- 
-tCy    =3 = = = =	-5< 	-EH,> 	- 	- 	- 	- 5: sU\1	   &* *#)el": *s * * * *"                                     &
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 w~uS#X77: : :r   