OpenDAS / ColossalAI

Commit c336cd30
[NFC] polish colossalai/communication/utils.py code style (#656)
Authored Apr 02, 2022 by FredHuang99; committed by binmakeswell on Apr 06, 2022
Parent: 5ab9a712
Showing 1 changed file with 2 additions and 6 deletions

colossalai/communication/utils.py (+2, -6)
@@ -77,9 +77,7 @@ def split_tensor_into_1d_equal_chunks(tensor, new_buffer=False):
    start_index = partition_size * gpc.get_local_rank(ParallelMode.PARALLEL_1D)
    end_index = start_index + partition_size
    if new_buffer:
        data = torch.empty(partition_size, dtype=tensor.dtype,
                           device=torch.cuda.current_device(), requires_grad=False)
        data.copy_(tensor.view(-1)[start_index:end_index])
    else:
        data = tensor.view(-1)[start_index:end_index]
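For readers skimming the diff: split_tensor_into_1d_equal_chunks hands each 1D-parallel rank a contiguous slice of the flattened tensor, either as a view or as a freshly allocated copy. Below is a minimal CPU-only sketch of that logic, with the ColossalAI globals (gpc, ParallelMode.PARALLEL_1D) replaced by explicit rank and world_size arguments; the function name and signature are illustrative, not ColossalAI's API.

import torch

def split_1d_equal_chunks(tensor, rank, world_size, new_buffer=False):
    # Illustrative stand-in for ColossalAI's helper: each rank gets an equal,
    # contiguous 1/world_size slice of the flattened tensor.
    partition_size = torch.numel(tensor) // world_size
    start_index = partition_size * rank  # gpc.get_local_rank(...) in the real code
    end_index = start_index + partition_size
    if new_buffer:
        # Copy into a fresh buffer so the chunk owns its own memory.
        data = torch.empty(partition_size, dtype=tensor.dtype, requires_grad=False)
        data.copy_(tensor.view(-1)[start_index:end_index])
    else:
        # Cheap path: return a view into the original storage, no copy.
        data = tensor.view(-1)[start_index:end_index]
    return data

# Example: 8 elements over 4 ranks -> 2 elements per rank.
print(split_1d_equal_chunks(torch.arange(8.), rank=1, world_size=4))  # tensor([2., 3.])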
@@ -97,9 +95,7 @@ def gather_split_1d_tensor(tensor):
    world_size = gpc.get_world_size(ParallelMode.PARALLEL_1D)
    numel = torch.numel(tensor)
    numel_gathered = world_size * numel
    gathered = torch.empty(numel_gathered, dtype=tensor.dtype,
                           device=torch.cuda.current_device(), requires_grad=False)
    chunks = [gathered[i * numel:(i + 1) * numel] for i in range(world_size)]
    dist.all_gather(chunks, tensor, group=gpc.get_group(ParallelMode.PARALLEL_1D))
    return gathered
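The gather side shows the standard trick of preallocating one contiguous output buffer and passing dist.all_gather a list of views into it, so each rank's chunk lands in place and no extra concatenation is needed. A runnable single-process sketch under the same assumptions (explicit world_size instead of gpc, gloo backend on CPU instead of NCCL; the helper name and the rendezvous address are hypothetical):

import torch
import torch.distributed as dist

def gather_split_1d(tensor, world_size, group=None):
    # Preallocate the full output, then give all_gather views into it so each
    # rank's chunk is written directly in place (mirrors the diff above).
    numel = torch.numel(tensor)
    gathered = torch.empty(world_size * numel, dtype=tensor.dtype, requires_grad=False)
    chunks = [gathered[i * numel:(i + 1) * numel] for i in range(world_size)]
    dist.all_gather(chunks, tensor, group=group)
    return gathered

if __name__ == "__main__":
    # Single-process demo; real deployments launch one process per rank and
    # would use the NCCL backend plus the PARALLEL_1D group as in the diff.
    dist.init_process_group("gloo", init_method="tcp://127.0.0.1:29500",
                            rank=0, world_size=1)
    part = torch.arange(4.)
    print(gather_split_1d(part, dist.get_world_size()))  # tensor([0., 1., 2., 3.])
    dist.destroy_process_group()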