from abc import ABC, abstractmethod
from typing import Any, List, Optional, Tuple

import torch
import torch.distributed as dist
from torch.distributed._shard.sharded_tensor.api import ShardedTensor
from torch.distributed._shard.sharded_tensor.shard import Shard
from torch.distributed._tensor import DeviceMesh, DTensor
from torch.distributed.fsdp._shard_utils import (
    _all_gather_dtensor,
    _create_chunk_dtensor,
    _create_chunk_sharded_tensor,
)


class FSDPExtensions(ABC):
    """
    This enables some customizable hooks to enable composability with tensor
    parallelism. To activate these hooks, use :func:`_set_fsdp_extensions` to
    set a custom :class:`FSDPExtensions` that implements the hooks.
    """

    @abstractmethod
    def pre_flatten_transform(
        self,
        tensor: torch.Tensor,
    ) -> Tuple[torch.Tensor, Optional[Any]]:
        """E.g. converting ``DistributedTensor`` to local tensor."""
        ...

    @abstractmethod
    def post_unflatten_transform(
        self,
        tensor: torch.Tensor,
        param_extension: Any,
    ) -> torch.Tensor:
        """E.g. converting local tensor to ``DistributedTensor``."""
        ...

    @abstractmethod
    def chunk_tensor(
        self,
        tensor: torch.Tensor,
        rank: int,
        world_size: int,
        num_devices_per_node: int,
        pg: dist.ProcessGroup,
        device: Optional[torch.device] = None,
    ) -> torch.Tensor:
        """Shards a tensor to chunks and returns the local chunk."""
        ...

    @abstractmethod
    def chunk_dtensor(
        self,
        tensor: torch.Tensor,
        rank: int,
        device_mesh: DeviceMesh,
    ) -> torch.Tensor:
        """Shards a tensor/DTensor to DTensor and returns the local DTensor."""
        ...

    @abstractmethod
    def pre_load_state_dict_transform(
        self,
        tensor: torch.Tensor,
    ) -> Tuple[torch.Tensor, List[Shard]]:
        """
        This is to be called before loading a *sharded* model state dict and
        should return the tensor and list of shards from which to load data.
        """
        ...

    @abstractmethod
    def all_gather_dtensor(
        self,
        tensor: DTensor,
        parent_mesh: Optional[DeviceMesh],
    ) -> torch.Tensor:
        """
        This is to be called before loading a *sharded* DTensor state dict.
        This gathers tensor in FSDP dimension and returns local tensor of
        TP DTensor.
        """
        ...


_extensions: Optional[FSDPExtensions] = None


def _set_fsdp_extensions(flattener: FSDPExtensions) -> None:
    global _extensions
    _extensions = flattener


def _ext_pre_flatten_transform(
    tensor: torch.Tensor,
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> Tuple[torch.Tensor, Optional[Any]]:
    if fsdp_extension is not None:
        new_tensor, param_extension = fsdp_extension.pre_flatten_transform(tensor)
        if param_extension is not None:
            return new_tensor, param_extension
    return tensor, None


def _ext_post_unflatten_transform(
    tensor: torch.Tensor,
    param_extension: Any,
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> torch.Tensor:
    if fsdp_extension is not None and param_extension is not None:
        return fsdp_extension.post_unflatten_transform(tensor, param_extension)
    return tensor


def _ext_chunk_tensor(
    tensor: torch.Tensor,
    rank: int,
    world_size: int,
    num_devices_per_node: int,
    pg: dist.ProcessGroup,
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> torch.Tensor:
    chunk_tensor_fn = (
        fsdp_extension.chunk_tensor
        if fsdp_extension is not None
        else _create_chunk_sharded_tensor
    )
    return chunk_tensor_fn(
        tensor,
        rank,
        world_size,
        num_devices_per_node,
        pg,
    )


def _ext_chunk_dtensor(
    tensor: torch.Tensor,
    rank: int,
    device_mesh: DeviceMesh,
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> torch.Tensor:
    chunk_dtensor_fn = (
        fsdp_extension.chunk_dtensor
        if fsdp_extension is not None
        else _create_chunk_dtensor
    )
    return chunk_dtensor_fn(
        tensor,
        rank,
        device_mesh,
    )


def _ext_pre_load_state_dict_transform(
    tensor: torch.Tensor,
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> Tuple[torch.Tensor, List[Shard]]:
    if fsdp_extension is not None:
        return fsdp_extension.pre_load_state_dict_transform(tensor)

    assert type(tensor) is ShardedTensor
    shards = tensor.local_shards()
    return tensor, shards


def _ext_all_gather_dtensor(
    tensor: DTensor,
    parent_mesh: Optional[DeviceMesh],
    fsdp_extension: Optional[FSDPExtensions] = None,
) -> torch.Tensor:
    all_gather_dtensor_fn = (
        fsdp_extension.all_gather_dtensor
        if fsdp_extension is not None
        else _all_gather_dtensor
    )
    return all_gather_dtensor_fn(
        tensor,
        parent_mesh,
    )