Fix precision bug: only disable the memory-efficient attention kernel when fp16 autocast is actually enabled

a17a9777 · Gustaf Ahdritz · 48670cfc · a17a9777 · a17a9777 · a17a9777
Commit a17a9777 authored Oct 06, 2022 by Gustaf Ahdritz
4 changed files
--- a/openfold/model/heads.py
+++ b/openfold/model/heads.py
@@ -150,15 +150,15 @@ class DistogramHead(nn.Module):
        logits = logits + logits.transpose(-2, -3)
        return logits
    
-    def forward(self, z):
-        
+    def forward(self, z): 
        float16_enabled = (torch.get_autocast_gpu_dtype() == torch.float16)
        if float16_enabled and torch.is_autocast_enabled():
            with torch.cuda.amp.autocast(enabled=False):
                return self._forward(z.float())
        else:
            return self._forward(z)
-        
+
+
 class TMScoreHead(nn.Module):
    """
    For use in computation of TM-score, subsection 1.9.7

--- a/openfold/model/primitives.py
+++ b/openfold/model/primitives.py
@@ -480,8 +480,9 @@ class Attention(nn.Module):

        # [*, Q, H, C_hidden]
        float16_enabled = (torch.get_autocast_gpu_dtype() == torch.float16)
-        if float16_enabled:
+        if float16_enabled and torch.is_autocast_enabled():
            use_memory_efficient_kernel = False
+        
        if(use_memory_efficient_kernel):
            if(len(biases) > 2):
                raise ValueError(

--- a/openfold/model/structure_module.py
+++ b/openfold/model/structure_module.py
@@ -324,6 +324,7 @@ class InvariantPointAttention(nn.Module):
                permute_final_dims(q, (1, 0, 2)),  # [*, H, N_res, C_hidden]
                permute_final_dims(k, (1, 2, 0)),  # [*, H, C_hidden, N_res]
            )
+        
        a *= math.sqrt(1.0 / (3 * self.c_hidden))
        a += (math.sqrt(1.0 / 3) * permute_final_dims(b, (2, 0, 1)))


--- a/openfold/model/triangular_multiplicative_update.py
+++ b/openfold/model/triangular_multiplicative_update.py
@@ -391,12 +391,14 @@ class TriangleMultiplicativeUpdate(nn.Module):
        b = mask
        b = b * self.sigmoid(self.linear_b_g(z))
        b = b * self.linear_b_p(z)
+        
        float16_enabled = (torch.get_autocast_gpu_dtype() == torch.float16)
        if float16_enabled and torch.is_autocast_enabled():
            with torch.cuda.amp.autocast(enabled=False):
                x = self._combine_projections(a.float(), b.float())
        else:
            x = self._combine_projections(a, b)
+        
        del a, b
        x = self.layer_norm_out(x)
        x = self.linear_z(x)