o
    H&i                     @   sn  d dl Z d dlZd dlmZmZmZ d dlZg dZd Z	dd Z
dd Zdd	 Zd
d Zdeejeej f ddfddZde	ddfddZdd e	ddfdddeej deeejeej f  dededeeejj  deeej  ddfddZ	d deej deddfddZ		d!deej deej ddfddZe	ddfdeej deej deddfddZdS )"    N)OptionalSequenceUnion)
all_reducereduce	broadcast
all_gatherreduce_scatterc                 C   st   t tjdstd dS t }| D ]%}|jr dS | s! dS |js' dS |	 }||v r2 dS |
| qdS )N_nccl_all_reducez)PyTorch is not compiled with NCCL supportFT)hasattrtorch_CwarningswarnsetZ	is_sparseZis_contiguousZis_cudaZ
get_deviceadd)ZtensorsZdevicesZtensorZdevice r   :C:\wamp64\www\opt\env\Lib\site-packages\torch/cuda/nccl.pyis_available   s    
r   c                  C   sT   t j } | d? }| d? d@ }| d@ }t j d}|dkr$|||fS ||||fS )N       i  zutf-8 )r   r   Z_nccl_versionZ_nccl_version_suffixdecode)vermajorminorpatchsuffixr   r   r   version"   s   

r   c                   C   s
   t j S N)r   r   Z_nccl_unique_idr   r   r   r   	unique_id.   s   
r    c                 C   s   t j| ||S r   )r   r   Z_nccl_init_rank)Z	num_ranksuidZrankr   r   r   	init_rank2   s   r"   inputsreturnc                 C   s&   t | tjjrt | tjrtdd S )Nz(Inputs should be a collection of tensors)
isinstancecollectionsabc	Containerr   Tensor	TypeError)r#   r   r   r   _check_sequence_type6   s
   r+   c                 C   s4   t |  |d u r
| }t | tj| |||| d S r   )r+   r   r   r
   r#   outputsopstreamscommsr   r   r   r   =   s
   r   )r-   outputrootr.   r/   r-   c                C   s   t |  |d ur|d urtdtd || }n!t|tjs1t|tjj	r1td || }n
|d u r9| | n|}tj
| ||||| d S )Nz'output' and 'outputs' can not be both specified. 'outputs' is deprecated in favor of 'output', taking in a single output tensor. The signature of reduce is: reduce(inputs, output=None, root=0, op=SUM, streams=None, comms=None).znccl.reduce with an output tensor list is deprecated. Please specify a single output tensor with argument 'output' instead instead.z\nccl.reduce with an output tensor list is deprecated. Please specify a single output tensor.)r+   
ValueErrorr   r   r%   r   r)   r&   r'   r   r   Z_nccl_reduce)r#   r1   r2   r.   r/   r0   r-   _outputr   r   r   r   G   s&   


r   c                 C   s   t |  tj| ||| d S r   )r+   r   r   Z_nccl_broadcast)r#   r2   r/   r0   r   r   r   r   n   s   r   c                 C   s&   t |  t | tj| ||| d S r   )r+   r   r   Z_nccl_all_gather)r#   r-   r/   r0   r   r   r   r   u   s   r   c                 C   s(   t |  t | tj| |||| d S r   )r+   r   r   Z_nccl_reduce_scatterr,   r   r   r   r	      s   r	   )r   NN)NN)r&   r   typingr   r   r   Z
torch.cudar   __all__ZSUMr   r   r    r"   r)   r+   r   intcudaZStreamr   r   r   r	   r   r   r   r   <module>   s~    "	
(


