Unverified commit 989a30a0, authored by gushiqiao and committed by GitHub
Browse files

Change weight swapping to block swapping (#482)

parent 226e71e1
......@@ -549,7 +549,7 @@ class T5Encoder(nn.Module):
with torch.cuda.stream(self.offload_manager.compute_stream):
x = self.forward_block_with_offload(self.offload_manager.cuda_buffers[0], x, mask, pos_bias=e)
-self.offload_manager.swap_weights()
+self.offload_manager.swap_blocks()
x = self.norm(x)
x = self.dropout(x)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment