
    ̩hK%                     T   d dl Z d dlZd dlmZ  eej
                  d      s> ed      ej
                  j                  d<    ed      ej
                  j                  d<    G d dej
                  j                        Z G d de      Z	 G d	 d
ej
                  j                        Zy)    N)_dummy_type_CudaStreamBase_CudaEventBasec                        e Zd ZdZd fd	ZddZddZddZdef fdZ	d fdZ
ed	        Zdef fd
Zd Zd Z xZS )Streama  Wrapper around a CUDA stream.

    A CUDA stream is a linear sequence of execution that belongs to a specific
    device, independent from other streams. It supports with statement as a
    context manager to ensure the operators within the with block are running
    on the corresponding stream.  See :ref:`cuda-semantics` for details.

    Args:
        device(torch.device or int, optional): a device on which to allocate
            the stream. If :attr:`device` is ``None`` (default) or a negative
            integer, this will use the current device.
        priority(int, optional): priority of the stream, which can be positive, 0, or negative.
            A lower number indicates a higher priority. By default, the priority is set to 0.
            If the value falls outside of the allowed priority range, it will automatically be
            mapped to the nearest valid priority (lowest for large positive numbers or
            highest for large negative numbers).

    c                     |d|v rd|v rt        |   | fd|i|S t        j                  j	                  |      5  t        |   | fd|i|cd d d        S # 1 sw Y   y xY w)N	stream_iddevice_indexpriority)super__new__torchcudadevice)clsr   r   kwargs	__class__s       P/var/www/html/eduruby.in/venv/lib/python3.12/site-packages/torch/cuda/streams.pyr   zStream.__new__"   sp    >kV3&8P7?3DDVDD""6* IwsHXHHI I Is   AA"returnc                 &    |j                  |        y)a  Make all future work submitted to the stream wait for an event.

        Args:
            event (torch.cuda.Event): an event to wait for.

        .. note:: This is a wrapper around ``cudaStreamWaitEvent()``: see
           `CUDA Stream documentation`_ for more info.

           This function returns without waiting for :attr:`event`: only future
           operations are affected.

        .. _CUDA Stream documentation:
           https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__STREAM.html
        N)waitselfevents     r   
wait_eventzStream.wait_event*   s     	

4    c                 B    | j                  |j                                y)a  Synchronize with another stream.

        All future work submitted to this stream will wait until all kernels
        submitted to a given stream at the time of call complete.

        Args:
            stream (Stream): a stream to synchronize.

        .. note:: This function returns without waiting for currently enqueued
           kernels in :attr:`stream`: only future operations are affected.
        N)r   record_event)r   streams     r   wait_streamzStream.wait_stream;   s     	++-.r   c                 @    |
t               }|j                  |        |S )zRecord an event.

        Args:
            event (torch.cuda.Event, optional): event to record. If not given, a new one
                will be allocated.

        Returns:
            Recorded event.
        )Eventrecordr   s     r   r   zStream.record_eventI   s!     =GETr   c                      t         |          S )zCheck if all the work submitted has been completed.

        Returns:
            A boolean indicating if all kernels in this stream are completed.
        r   queryr   r   s    r   r&   zStream.queryX   s     w}r   c                 "    t         |           y)zWait for all the kernels in this stream to complete.

        .. note:: This is a wrapper around ``cudaStreamSynchronize()``: see
           `CUDA Stream documentation`_ for more info.
        Nr   synchronizer'   s    r   r*   zStream.synchronize`   s     	r   c                 @    t        j                  | j                        S N)ctypesc_void_pcuda_streamr   s    r   _as_parameter_zStream._as_parameter_h   s    t//00r   c                 D    t        |t              rt        |   |      S y)NF)
isinstancer   r   __eq__)r   or   s     r   r4   zStream.__eq__l   s    a 7>!$$r   c                 D    t        | j                  | j                  f      S r,   )hashr/   r   r0   s    r   __hash__zStream.__hash__q   s    T%%t{{344r   c                 >    d| j                    d| j                  ddS )Nz<torch.cuda.Stream device=z cuda_stream=#x>)r   r/   r0   s    r   __repr__zStream.__repr__t   s&    +DKK=dFVFVWYEZZ[\\r   )Nr   r   Nr,   )__name__
__module____qualname____doc__r   r   r    r   boolr&   r*   propertyr1   r4   r8   r<   __classcell__r   s   @r   r   r      sY    &I"/t  1 14 
5]r   r   c                   $     e Zd ZdZd fd	Z xZS )ExternalStreama  Wrapper around an externally allocated CUDA stream.

    This class is used to wrap streams allocated in other libraries in order
    to facilitate data exchange and multi-library interactions.

    .. note:: This class doesn't manage the stream life-cycle, it is the user
       responsibility to keep the referenced stream alive while this class is
       being used.

    Args:
        stream_ptr(int): Integer representation of the `cudaStream_t` value.
            allocated externally.
        device(torch.device or int, optional): the device where the stream
            was originally allocated. If device is specified incorrectly,
            subsequent launches using this stream may fail.
    c                     t         j                  j                  |      5  t        |   | fd|i|cd d d        S # 1 sw Y   y xY w)N
stream_ptr)r   r   r   r   r   )r   rI   r   r   r   s       r   r   zExternalStream.__new__   sD    ZZv& 	I7?3H:HH	I 	I 	Is	   =Ar,   )r>   r?   r@   rA   r   rD   rE   s   @r   rG   rG   x   s    "I Ir   rG   c                        e Zd ZdZ	 d fd	Ze fd       Zd fd	Zdd fdZ fdZ	 fdZ
d fd	Z fd
Zed        ZdefdZ xZS )r"   a  Wrapper around a CUDA event.

    CUDA events are synchronization markers that can be used to monitor the
    device's progress, to accurately measure timing, and to synchronize CUDA
    streams.

    The underlying CUDA events are lazily initialized when the event is first
    recorded or exported to another process. After creation, only streams on the
    same device may record the event. However, streams on any device can wait on
    the event.

    Args:
        enable_timing (bool, optional): indicates if the event should measure time
            (default: ``False``)
        blocking (bool, optional): if ``True``, :meth:`wait` will be blocking (default: ``False``)
        interprocess (bool): if ``True``, the event can be shared between processes
            (default: ``False``)
        external (bool, optional): indicates whether this event should create event record and event wait nodes, or create an internal cross-stream dependency, when captured in a cuda graph. See `cross-stream dependencies <https://docs.nvidia.com/cuda/archive/12.9.0/cuda-c-programming-guide/index.html#cross-stream-dependencies-and-events>`_, `cudaEventRecordExternal <https://docs.nvidia.com/cuda/archive/12.9.0/cuda-runtime-api/group__CUDART__TYPES.html#group__CUDART__TYPES_1g3457b81d1d32c6a00f6132fbc2693d47>`_, and `cudaEventWaitExternal <https://docs.nvidia.com/cuda/archive/12.9.0/cuda-runtime-api/group__CUDART__TYPES.html#group__CUDART__TYPES_1g0c23426b7252eaa9cef695859991304e>`_ for more information about internal vs. external events. (default: ``False``)

    .. _CUDA Event Documentation:
       https://docs.nvidia.com/cuda/cuda-runtime-api/group__CUDART__EVENT.html
    c                 ,    t         |   | ||||      S )N)enable_timingblockinginterprocessexternal)r   r   )r   rL   rM   rN   rO   r   s        r   r   zEvent.__new__   s*     w'%  
 	
r   c                 $    t         |   ||      S )z<Reconstruct an event from an IPC handle on the given device.)r   from_ipc_handle)r   r   handler   s      r   rQ   zEvent.from_ipc_handle   s     w&vv66r   c                 d    |t         j                  j                         }t        |   |       y)zRecord the event in a given stream.

        Uses ``torch.cuda.current_stream()`` if no stream is specified. The
        stream's device must match the event's device.
        N)r   r   current_streamr   r#   r   r   r   s     r   r#   zEvent.record   s(     >ZZ..0Fvr   r   c                 d    |t         j                  j                         }t        |   |       y)a  Make all future work submitted to the given stream wait for this event.

        Use ``torch.cuda.current_stream()`` if no stream is specified.

        .. note:: This is a wrapper around ``cudaStreamWaitEvent()``: see
            `CUDA Event documentation`_ for more info.
        N)r   r   rT   r   r   rU   s     r   r   z
Event.wait   s(     >ZZ..0FVr   c                      t         |          S )zCheck if all work currently captured by event has completed.

        Returns:
            A boolean indicating if all work currently captured by event has
            completed.
        r%   r'   s    r   r&   zEvent.query   s     w}r   c                 "    t         |   |      S )zReturn the time elapsed.

        Time reported in milliseconds after the event was recorded and
        before the end_event was recorded.
        )r   elapsed_time)r   	end_eventr   s     r   rY   zEvent.elapsed_time   s     w#I..r   c                 "    t         |           y)aN  Wait for the event to complete.

        Waits until the completion of all work currently captured in this event.
        This prevents the CPU thread from proceeding until the event completes.

         .. note:: This is a wrapper around ``cudaEventSynchronize()``: see
            `CUDA Event documentation`_ for more info.
        Nr)   r'   s    r   r*   zEvent.synchronize   s     	r   c                      t         |          S )zqReturn an IPC handle of this event.

        If not recorded yet, the event will use the current device.
        )r   
ipc_handler'   s    r   r]   zEvent.ipc_handle   s    
 w!##r   c                 @    t        j                  | j                        S r,   )r-   r.   
cuda_eventr0   s    r   r1   zEvent._as_parameter_   s    t//r   c                 R    | j                   rd| j                  j                  ddS y)Nz<torch.cuda.Event r:   r;   z <torch.cuda.Event uninitialized>)r_   r1   valuer0   s    r   r<   zEvent.__repr__   s*    ??'(;(;(A(A"'EQGG5r   )FFFFr,   r=   )r>   r?   r@   rA   r   classmethodrQ   r#   r   r&   rY   r*   r]   rC   r1   strr<   rD   rE   s   @r   r"   r"      sf    0 PU	
 7 7
/	$ 0 06# 6r   r"   )r-   r   torch._utilsr   hasattr_C__dict__r   r   rG   r   r"    r   r   <module>ri      s      $ uxx*++67H+IEHH'(*56F*GEHH&'g]UXX%% g]TIV I.i6EHH## i6r   