import collections
import ctypes
from typing import Any, Union

import torch
from torch._utils import _dummy_type
from torch.types import Device

from . import _get_device_index, _is_compiled, _lazy_init, is_initialized


if not _is_compiled():
    torch._C.__dict__["_xpu_XPUAllocator"] = _dummy_type("_xpu_XPUAllocator")

_device_t = Union[Device, str, int, None]


def empty_cache() -> None:
    r"""Release all unoccupied cached memory currently held by the caching
    allocator so that it can be used by other XPU applications.

    .. note::
        :func:`~torch.xpu.empty_cache` doesn't increase the amount of XPU
        memory available for PyTorch. However, it may help reduce fragmentation
        of XPU memory in certain cases.
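
    Example (illustrative; assumes an XPU-enabled build with at least one device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> x = torch.randn(1024, 1024, device="xpu")
        >>> del x
        >>> torch.xpu.empty_cache()  # return the cached block to the driver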
    """
    if is_initialized():
        torch._C._xpu_emptyCache()


def reset_peak_memory_stats(device: _device_t = None) -> None:
    r"""Reset the "peak" stats tracked by the XPU memory allocator.

    See :func:`~torch.xpu.memory_stats` for details. Peak stats correspond to the
    `"peak"` key in each individual stat dict.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
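
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> torch.xpu.reset_peak_memory_stats()
        >>> y = torch.randn(4096, 4096, device="xpu")
        >>> peak = torch.xpu.max_memory_allocated()  # peak since the reset above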
    Toptional)r   r   r   _xpu_resetPeakMemoryStatsr   s    r   reset_peak_memory_statsr       s%     v5F88--f55r   c                 Z    t        | d      } t        j                  j                  |       S )a  Reset the "accumulated" (historical) stats tracked by the XPU memory allocator.

    See :func:`~torch.xpu.memory_stats` for details. Accumulated stats correspond to
    the `"allocated"` and `"freed"` keys in each individual stat dict.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
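
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> torch.xpu.reset_accumulated_memory_stats()
        >>> # the historical "allocated" / "freed" counters now start from zero again
        >>> torch.xpu.memory_stats()["allocated_bytes.all.allocated"]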
    """
    device = _get_device_index(device, optional=True)
    return torch._C._xpu_resetAccumulatedMemoryStats(device)


def memory_stats_as_nested_dict(device: _device_t = None) -> dict[str, Any]:
    r"""Return the result of :func:`~torch.xpu.memory_stats` as a nested dictionary."""
    if not is_initialized():
        return {}
    device = _get_device_index(device, optional=True)
    return torch._C._xpu_memoryStats(device)


def memory_stats(device: _device_t = None) -> dict[str, Any]:
    r"""Return a dictionary of XPU memory allocator statistics for a given device.

    The return value of this function is a dictionary of statistics, each of
    which is a non-negative integer.

    Core statistics:

    - ``"allocated_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of allocated memory.
    - ``"reserved_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of reserved memory.
    - ``"active_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of active memory.
    - ``"requested_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      memory requested by client code; compare this with ``allocated_bytes`` to
      check whether allocation rounding adds too much overhead.

    For these core statistics, values are broken down as follows.

    Pool type:

    - ``all``: combined statistics across all memory pools.
    - ``large_pool``: statistics for the large allocation pool (for size >= 1MB allocations).
    - ``small_pool``: statistics for the small allocation pool (for size < 1MB allocations).

    Metric type:

    - ``current``: current value of this metric.
    - ``peak``: maximum value of this metric.
    - ``allocated``: historical total increase in this metric.
    - ``freed``: historical total decrease in this metric.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistics for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
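
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> stats = torch.xpu.memory_stats()
        >>> stats["allocated_bytes.all.peak"]  # keys are flattened "stat.pool.metric" strings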
    """
    result = []

    def _recurse_add_to_result(prefix: str, obj: Any) -> None:
        if isinstance(obj, dict):
            if len(prefix) > 0:
                prefix += "."
            for k, v in obj.items():
                _recurse_add_to_result(prefix + k, v)
        else:
            result.append((prefix, obj))

    stats = memory_stats_as_nested_dict(device=device)
    _recurse_add_to_result("", stats)
    result.sort()

    return collections.OrderedDict(result)


def memory_allocated(device: _device_t = None) -> int:
    r"""Return the current GPU memory occupied by tensors in bytes for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).

    .. note::
        This is likely less than the amount shown in `xpu-smi` since some
        unused memory can be held by the caching allocator and some context
        needs to be created on the GPU.
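
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> x = torch.empty(1024, 1024, device="xpu")  # ~4 MiB of float32
        >>> bytes_in_use = torch.xpu.memory_allocated()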
    """
    return memory_stats(device=device).get("allocated_bytes.all.current", 0)


def max_memory_allocated(device: _device_t = None) -> int:
    r"""Return the maximum GPU memory occupied by tensors in bytes for a given device.

    By default, this returns the peak allocated memory since the beginning of
    this program. :func:`~torch.xpu.reset_peak_memory_stats` can be used to
    reset the starting point in tracking this metric. For example, these two
    functions can measure the peak allocated memory usage of each iteration in a
    training loop.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
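
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> a = torch.randn(2048, 2048, device="xpu")
        >>> for step in range(3):
        ...     torch.xpu.reset_peak_memory_stats()
        ...     b = a @ a
        ...     print(step, torch.xpu.max_memory_allocated())  # per-iteration peak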
    """
    return memory_stats(device=device).get("allocated_bytes.all.peak", 0)


def memory_reserved(device: _device_t = None) -> int:
    r"""Return the current GPU memory managed by the caching allocator in bytes for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
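
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> reserved = torch.xpu.memory_reserved()
        >>> allocated = torch.xpu.memory_allocated()
        >>> assert reserved >= allocated  # tensors are carved out of reserved blocks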
    """
    return memory_stats(device=device).get("reserved_bytes.all.current", 0)


def max_memory_reserved(device: _device_t = None) -> int:
    r"""Return the maximum GPU memory managed by the caching allocator in bytes for a given device.

    By default, this returns the peak cached memory since the beginning of this
    program. :func:`~torch.xpu.reset_peak_memory_stats` can be used to reset
    the starting point in tracking this metric. For example, these two functions
    can measure the peak cached memory amount of each iteration in a training
    loop.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    """
    return memory_stats(device=device).get("reserved_bytes.all.peak", 0)


def mem_get_info(device: _device_t = None) -> tuple[int, int]:
    r"""Return the global free and total GPU memory for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            the statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).

    Returns:
        int: the memory available on the device in units of bytes.
        int: the total memory on the device in units of bytes.
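
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> free, total = torch.xpu.mem_get_info()
        >>> used_fraction = 1 - free / total  # device-wide, not just this process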
    """
    _lazy_init()
    device = _get_device_index(device, optional=True)
    return torch._C._xpu_getMemoryInfo(device)


def get_per_process_memory_fraction(device: _device_t = None) -> float:
    r"""
    Retrieve the memory fraction currently set for a process on a given XPU device.
    This fraction represents the portion of the total device memory that
    the caching allocator is allowed to use. The allowed memory is calculated as:

    .. math:: \text{allowed\_memory} = \text{total\_memory} \times \text{fraction}

    Args:
        device (torch.device or int or str, optional): selected device. It uses the current device,
            given by :func:`~torch.xpu.current_device`, if :attr:`device` is ``None`` (default).

    Returns:
        float: The memory fraction in the range 0.0 to 1.0.
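
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> fraction = torch.xpu.get_per_process_memory_fraction()
        >>> allowed = fraction * torch.xpu.mem_get_info()[1]  # bytes this process may use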
    """
    _lazy_init()
    device = _get_device_index(device, optional=True)
    return torch._C._xpu_getMemoryFraction(device)


def set_per_process_memory_fraction(fraction: float, device: _device_t = None) -> None:
    r"""
    Set the memory fraction for a single process on an XPU device.
    This function limits the amount of memory that the caching allocator can allocate
    on the specified XPU device. The allowed memory is computed as:

    .. math:: \text{allowed\_memory} = \text{total\_memory} \times \text{fraction}

    If the process attempts to allocate more than this allowed memory,
    an out-of-memory error will be raised by the allocator.

    Arguments:
        fraction (float): Range: 0~1. Allowed memory equals total_memory * fraction.
        device (torch.device or int or str, optional): selected device. It uses the current device,
            given by :func:`~torch.xpu.current_device`, if :attr:`device` is ``None`` (default).

    .. note:: In general, the total available free memory is less than the total capacity.
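
    Example (illustrative; assumes an XPU device)::

        >>> # xdoctest: +SKIP("requires XPU")
        >>> torch.xpu.set_per_process_memory_fraction(0.5)
        >>> # allocations beyond half of the device's total memory now raise OOM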
    """
    _lazy_init()
    device = _get_device_index(device, optional=True)
    if not isinstance(fraction, float):
        raise TypeError("Invalid type for fraction argument, must be `float`")
    torch._C._xpu_setMemoryFraction(fraction, device)


class _XPUAllocator:
    r"""Wrapper over internal XPU memory allocators."""

    def __init__(self, allocator: torch._C._xpu_XPUAllocator):
        self._allocator = allocator

    def allocator(self):
        return self._allocator


class XPUPluggableAllocator(_XPUAllocator):
    r"""XPU memory allocator loaded from a shared library."""

    def __init__(self, path_to_lib_file: str, alloc_fn_name: str, free_fn_name: str):
        r"""XPU memory allocator loaded dynamically from a shared library.

        This lets users provide custom allocation and free functions implemented
        in a separate shared library. The allocator is registered through
        ``torch._C._xpu_customAllocator`` and becomes available for use via
        ``torch.xpu.memory.change_current_allocator``.

        Arguments:
            path_to_lib_file (str):
                Filesystem path to the shared library file containing the allocation
                and free functions.
            alloc_fn_name (str):
                Name of the allocation function exported from the shared library.
                The function must have the signature:

                    ``void* alloc_fn(size_t size, int device, sycl::queue* queue);``

            free_fn_name (str):
                Name of the free function exported from the shared library.
                The function must have the signature:

                    ``void free_fn(void* ptr, size_t size, sycl::queue* queue);``
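
        Example (hypothetical sketch; ``my_alloc.so``, ``my_malloc`` and
        ``my_free`` are placeholder names for a user-provided library)::

            >>> # xdoctest: +SKIP("requires a custom allocator library")
            >>> allocator = torch.xpu.memory.XPUPluggableAllocator(
            ...     "my_alloc.so", "my_malloc", "my_free"
            ... )
            >>> torch.xpu.memory.change_current_allocator(allocator)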
        """
        allocator_lib = ctypes.CDLL(path_to_lib_file)
        alloc_fn_ptr = getattr(allocator_lib, alloc_fn_name)
        free_fn_ptr = getattr(allocator_lib, free_fn_name)
        alloc_fn_addr = ctypes.cast(alloc_fn_ptr, ctypes.c_void_p).value
        free_fn_addr = ctypes.cast(free_fn_ptr, ctypes.c_void_p).value
        if alloc_fn_addr is None or free_fn_addr is None:
            raise RuntimeError(
                "Failed to load allocator symbols from the shared library."
            )
        self._allocator = torch._C._xpu_customAllocator(alloc_fn_addr, free_fn_addr)


def change_current_allocator(allocator: _XPUAllocator) -> None:
    r"""Change the currently used memory allocator to be the one provided.

    .. note::
        If the current allocator has already been used/initialized, this function will error.

    Arguments:
        allocator (torch.xpu.memory._XPUAllocator): allocator to be set as the active one.
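
    Example (continuing the :class:`XPUPluggableAllocator` sketch above; the
    library path and symbol names are placeholders)::

        >>> # xdoctest: +SKIP("requires a custom allocator library")
        >>> allocator = torch.xpu.memory.XPUPluggableAllocator("my_alloc.so", "my_malloc", "my_free")
        >>> torch.xpu.memory.change_current_allocator(allocator)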
    """
    torch._C._xpu_changeCurrentAllocator(allocator.allocator())


def _get_current_allocator() -> _XPUAllocator:
    r"""Return the allocator being currently used.

    Returns:
        _XPUAllocator: the allocator being currently used.
    """
    return _XPUAllocator(torch._C._xpu_getAllocator())


__all__ = [
    "XPUPluggableAllocator",
    "change_current_allocator",
    "empty_cache",
    "get_per_process_memory_fraction",
    "max_memory_allocated",
    "max_memory_reserved",
    "mem_get_info",
    "memory_allocated",
    "memory_reserved",
    "memory_stats",
    "memory_stats_as_nested_dict",
    "reset_accumulated_memory_stats",
    "reset_peak_memory_stats",
    "set_per_process_memory_fraction",
]