o
    ¡…›im3  ã                   @   sÊ  d dl Z d dlZd dlmZmZ d dlZd dlmZ d dlm	Z	 ddl
mZmZmZmZ eƒ s7edƒejjd< ee	eedf Zd-d	d
„Zd.deddfdd„Zd.deddfdd„Zd.dedeeef fdd„Zd.dedeeef fdd„Zd.dedefdd„Zd.dedefdd„Zd.dedefdd„Zd.dedefdd„Zd.dedeeef fdd„Zd.dede fdd„Z!d.d e deddfd!d"„Z"G d#d$„ d$ƒZ#G d%d&„ d&e#ƒZ$d'e#ddfd(d)„Z%de#fd*d+„Z&g d,¢Z'dS )/é    N)ÚAnyÚUnion)Ú_dummy_type)ÚDeviceé   )Ú_get_device_indexÚ_is_compiledÚ
_lazy_initÚis_initializedÚ_xpu_XPUAllocatorÚreturnc                   C   s   t ƒ r
tj ¡  dS dS )aZ  Release all unoccupied cached memory currently held by the caching
    allocator so that those can be used in other XPU application.

    .. note::
        :func:`~torch.xpu.empty_cache` doesn't increase the amount of XPU
        memory available for PyTorch. However, it may help reduce fragmentation
        of XPU memory in certain cases.
    N)r
   ÚtorchÚ_CÚ_xpu_emptyCache© r   r   úR/sda-disk/www/egybert/egybert_env/lib/python3.10/site-packages/torch/xpu/memory.pyÚempty_cache   s   	ÿr   Údevicec                 C   ó   t | dd} tj | ¡S )a¬  Reset the "peak" stats tracked by the XPU memory allocator.

    See :func:`~torch.xpu.memory_stats` for details. Peak stats correspond to the
    `"peak"` key in each individual stat dict.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    T©Úoptional)r   r   r   Ú_xpu_resetPeakMemoryStats©r   r   r   r   Úreset_peak_memory_stats    ó   r   c                 C   r   )aÛ  Reset the "accumulated" (historical) stats tracked by the XPU memory allocator.

    See :func:`~torch.xpu.memory_stats` for details. Accumulated stats correspond to
    the `"allocated"` and `"freed"` keys in each individual stat dict.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    Tr   )r   r   r   Ú _xpu_resetAccumulatedMemoryStatsr   r   r   r   Úreset_accumulated_memory_stats/   r   r   c                 C   s"   t ƒ si S t| dd} tj | ¡S )zLReturn the result of :func:`~torch.xpu.memory_stats` as a nested dictionary.Tr   )r
   r   r   r   Ú_xpu_memoryStatsr   r   r   r   Úmemory_stats_as_nested_dict>   s   r   c                    sF   g ‰dt dtddf‡ ‡fdd„‰ t| d}ˆ d|ƒ ˆ ¡  t ˆ¡S )	a@  Return a dictionary of XPU memory allocator statistics for a given device.

    The return value of this function is a dictionary of statistics, each of
    which is a non-negative integer.

    Core statistics:

    - ``"allocated_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of allocated memory.
    - ``"reserved_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of reserved memory.
    - ``"active_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      amount of active memory.
    - ``"requested_bytes.{all,large_pool,small_pool}.{current,peak,allocated,freed}"``:
      memory requested by client code, compare this with allocated_bytes to check if
      allocation rounding adds too much overhead.

    For these core statistics, values are broken down as follows.

    Pool type:

    - ``all``: combined statistics across all memory pools.
    - ``large_pool``: statistics for the large allocation pool (for size >= 1MB allocations).
    - ``small_pool``: statistics for the small allocation pool (for size < 1MB allocations).

    Metric type:

    - ``current``: current value of this metric.
    - ``peak``: maximum value of this metric.
    - ``allocated``: historical total increase in this metric.
    - ``freed``: historical total decrease in this metric.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistics for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    ÚprefixÚobjr   Nc                    sT   t |tƒr!t| ƒdkr| d7 } | ¡ D ]\}}ˆ | | |ƒ qd S ˆ | |f¡ d S )Nr   Ú.)Ú
isinstanceÚdictÚlenÚitemsÚappend)r   r    ÚkÚv©Ú_recurse_add_to_resultÚresultr   r   r*   n   s   
ÿz,memory_stats.<locals>._recurse_add_to_resultr   Ú )Ústrr   r   ÚsortÚcollectionsÚOrderedDict)r   Ústatsr   r)   r   Úmemory_statsF   s   &
	

r2   c                 C   ó   t | d dd¡S )a  Return the current GPU memory occupied by tensors in bytes for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).

    .. note::
        This is likely less than the amount shown in `xpu-smi` since some
        unused memory can be held by the caching allocator and some context
        needs to be created on GPU.
    r   zallocated_bytes.all.currentr   ©r2   Úgetr   r   r   r   Úmemory_allocated~   s   r6   c                 C   r3   )a‰  Return the maximum GPU memory occupied by tensors in bytes for a given device.

    By default, this returns the peak allocated memory since the beginning of
    this program. :func:`~torch.xpu.reset_peak_memory_stats` can be used to
    reset the starting point in tracking this metric. For example, these two
    functions can measure the peak allocated memory usage of each iteration in a
    training loop.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    r   zallocated_bytes.all.peakr   r4   r   r   r   r   Úmax_memory_allocatedŽ   ó   r7   c                 C   r3   )aJ  Return the current GPU memory managed by the caching allocator in bytes for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    r   zreserved_bytes.all.currentr   r4   r   r   r   r   Úmemory_reservedŸ   s   r9   c                 C   r3   )a‘  Return the maximum GPU memory managed by the caching allocator in bytes for a given device.

    By default, this returns the peak cached memory since the beginning of this
    program. :func:`~torch.xpu.reset_peak_memory_stats` can be used to reset
    the starting point in tracking this metric. For example, these two functions
    can measure the peak cached memory amount of each iteration in a training
    loop.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).
    r   zreserved_bytes.all.peakr   r4   r   r   r   r   Úmax_memory_reservedª   r8   r:   c                 C   ó   t ƒ  t| dd} tj | ¡S )a½  Return the global free and total GPU memory for a given device.

    Args:
        device (torch.device or int or str, optional): selected device. Returns
            statistic for the current device, given by :func:`~torch.xpu.current_device`,
            if :attr:`device` is ``None`` (default).

    Returns:
        int: the memory available on the device in units of bytes.
        int: the total memory on the device in units of bytes
    Tr   )r	   r   r   r   Ú_xpu_getMemoryInfor   r   r   r   Úmem_get_info»   s   r=   c                 C   r;   )ab  
    Retrieve the memory fraction currently set for a process on a given XPU device.
    This fraction represents the portion of the total device memory that
    the caching allocator is allowed to use. The allowed memory is calculated as:

    .. math:: \text{allowed\_memory} = \text{total\_memory} \times \text{fraction}

    Args:
        device (torch.device or int or str, optional): selected device. It uses the current device,
            given by :func:`~torch.xpu.current_device`, if :attr:`device` is ``None`` (default).

    Returns:
        float: The memory fraction in the range 0.0 to 1.0.
    Tr   )r	   r   r   r   Ú_xpu_getMemoryFractionr   r   r   r   Úget_per_process_memory_fractionÌ   s   r?   Úfractionc                 C   s6   t ƒ  t|dd}t| tƒstdƒ‚tj | |¡ dS )a=  
    Set the memory fraction for a single process on XPU device.
    This function limits the amount of memory that the caching allocator can allocate
    on the specified XPU device. The allowed memory is computed as:

    .. math:: \text{allowed\_memory} = \text{total\_memory} \times \text{fraction}

    If the process attempts to allocate more than this allowed memory,
    an out-of-memory error will be raised by the allocator.

    Arguments:
        fraction (float): Range: 0~1. Allowed memory equals total_memory * fraction.
        device (torch.device or int or str, optional): selected device. It uses the current device,
            given by :func:`~torch.xpu.current_device`, if :attr:`device` is ``None`` (default).

    .. note:: In general, the total available free memory is less than the total capacity.
    Tr   z3Invalid type for fraction argument, must be `float`N)r	   r   r"   ÚfloatÚ	TypeErrorr   r   Ú_xpu_setMemoryFraction)r@   r   r   r   r   Úset_per_process_memory_fractionà   s
   
rD   c                   @   s*   e Zd ZdZdejjfdd„Zdd„ ZdS )Ú_XPUAllocatorz,Wrapper over internal XPU memory allocators.Ú	allocatorc                 C   s
   || _ d S ©N©Ú
_allocator)ÚselfrF   r   r   r   Ú__init__ý   s   
z_XPUAllocator.__init__c                 C   s   | j S rG   rH   )rJ   r   r   r   rF      s   z_XPUAllocator.allocatorN)	Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   r   r   rK   rF   r   r   r   r   rE   ú   s    rE   c                   @   s&   e Zd ZdZdededefdd„ZdS )ÚXPUPluggableAllocatorz2XPU memory allocator loaded from a shared library.Úpath_to_lib_fileÚalloc_fn_nameÚfree_fn_namec           	      C   sj   t  |¡}t||ƒ}t||ƒ}t  |t j¡j}t  |t j¡j}|du s'|du r+tdƒ‚tj 	||¡| _
dS )a  XPU memory allocator loaded dynamically from a shared library.

        This lets users provide custom allocation and free functions implemented
        in a separate shared library. The allocator is registered through
        ``torch._C._xpu_customAllocator`` and becomes available for use via
        ``torch.memory.xpu.change_current_allocator``.

        Arguments:
            path_to_lib_file (str):
                Filesystem path to the shared library file containing the allocation
                and free functions.
            alloc_fn_name (str):
                Name of the allocation function exported from the shared library.
                The function must have the signature:

                    ``void* alloc_fn(size_t size, int device, sycl::queue* queue);``

            free_fn_name (str):
                Name of the free function exported from the shared library.
                The function must have the signature:

                    ``void free_fn(void* ptr, size_t size, sycl::queue* queue);``
        Nz9Failed to load allocator symbols from the shared library.)ÚctypesÚCDLLÚgetattrÚcastÚc_void_pÚvalueÚRuntimeErrorr   r   Ú_xpu_customAllocatorrI   )	rJ   rQ   rR   rS   Úallocator_libÚalloc_fn_ptrÚfree_fn_ptrÚalloc_fn_addrÚfree_fn_addrr   r   r   rK     s   


ÿzXPUPluggableAllocator.__init__N)rL   rM   rN   rO   r-   rK   r   r   r   r   rP     s    rP   rF   c                 C   s   t j |  ¡ ¡ dS )a  Change the currently used memory allocator to be the one provided.

    .. note::
        If the current allocator has already been used/initialized, this function will error.

    Arguments:
        allocator (torch.xpu.memory._XPUAllocator): allocator to be set as the active one.
    N)r   r   Ú_xpu_changeCurrentAllocatorrF   )rF   r   r   r   Úchange_current_allocator/  s   	rb   c                   C   s   t tj ¡ ƒS )zxReturn the allocator being currently used.

    Returns:
        _XPUAllocator: the allocator being currently used.
    )rE   r   r   Ú_xpu_getAllocatorr   r   r   r   Ú_get_current_allocator;  s   rd   )rP   rb   r   r?   r7   r:   r=   r6   r9   r2   r   r   r   rD   )r   NrG   )(r/   rT   Útypingr   r   r   Útorch._utilsr   Útorch.typesr   r,   r   r   r	   r
   r   Ú__dict__r-   ÚintÚ	_device_tr   r   r   r#   r   r2   r6   r7   r9   r:   Útupler=   rA   r?   rD   rE   rP   rb   rd   Ú__all__r   r   r   r   Ú<module>   s6    
8
+