# Copyright 2021 AlQuraishi Laboratory
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import torch
import numpy as np
import unittest

from openfold.model.msa import (
    MSARowAttentionWithPairBias,
    MSAColumnAttention,
    MSAColumnGlobalAttention,
)
from openfold.utils.tensor_utils import tree_map
import tests.compare_utils as compare_utils
from tests.config import consts

# The test_compare cases below run the original AlphaFold modules through
# JAX/Haiku. Those packages are imported only when compare_utils reports that
# AlphaFold is installed, so this module can still be imported (and the
# test_shape cases run) without them.
if compare_utils.alphafold_is_installed():
    alphafold = compare_utils.import_alphafold()
    import jax
    import haiku as hk


class TestMSARowAttentionWithPairBias(unittest.TestCase):
    """Tests for the MSARowAttentionWithPairBias module."""

    def test_shape(self):
        """The output must have the same shape as the MSA input tensor."""
        batch_size = consts.batch_size
        n_seq = consts.n_seq
        n_res = consts.n_res
        c_m = consts.c_m
        c_z = consts.c_z
        c = 52
        no_heads = 4
        chunk_size = None

        mrapb = MSARowAttentionWithPairBias(c_m, c_z, c, no_heads)

        m = torch.rand((batch_size, n_seq, n_res, c_m))
        z = torch.rand((batch_size, n_res, n_res, c_z))

        shape_before = m.shape
        m = mrapb(m, z=z, chunk_size=chunk_size)
        shape_after = m.shape

        # assertEqual reports both shapes on failure, unlike assertTrue(a == b).
        self.assertEqual(shape_before, shape_after)

    @compare_utils.skip_unless_alphafold_installed()
    def test_compare(self):
        """Compare the OpenFold module against AlphaFold's on identical inputs.

        Runs AlphaFold's MSARowAttentionWithPairBias through Haiku with
        pretrained weights, runs the corresponding module of the pretrained
        OpenFold model on the same random inputs, and requires every output
        element to agree to within ``consts.eps``. The OpenFold side is
        executed with ``.cuda()``, so a CUDA device is required.
        """

        def run_msa_row_att(msa_act, msa_mask, pair_act):
            config = compare_utils.get_alphafold_config()
            c_e = config.model.embeddings_and_evoformer.evoformer
            msa_row = alphafold.model.modules.MSARowAttentionWithPairBias(
                c_e.msa_row_attention_with_pair_bias, config.model.global_config
            )
            act = msa_row(msa_act=msa_act, msa_mask=msa_mask, pair_act=pair_act)
            return act

        f = hk.transform(run_msa_row_att)

        n_res = consts.n_res
        n_seq = consts.n_seq

        msa_act = np.random.rand(n_seq, n_res, consts.c_m).astype(np.float32)
        # Random 0/1 mask, stored as float32.
        msa_mask = np.random.randint(low=0, high=2, size=(n_seq, n_res)).astype(
            np.float32
        )
        pair_act = np.random.rand(n_res, n_res, consts.c_z).astype(np.float32)

        # Fetch pretrained parameters (but only from one block)
        params = compare_utils.fetch_alphafold_module_weights(
            "alphafold/alphafold_iteration/evoformer/evoformer_iteration/"
            + "msa_row_attention"
        )
        # Keep only index 0 along the leading axis of every parameter array.
        params = tree_map(lambda n: n[0], params, jax.numpy.DeviceArray)

        out_gt = f.apply(
            params, None, msa_act, msa_mask, pair_act
        ).block_until_ready()
        out_gt = torch.as_tensor(np.array(out_gt))

        model = compare_utils.get_global_pretrained_openfold()
        out_repro = (
            model.evoformer.blocks[0]
            .msa_att_row(
                torch.as_tensor(msa_act).cuda(),
                z=torch.as_tensor(pair_act).cuda(),
                chunk_size=4,
                mask=torch.as_tensor(msa_mask).cuda(),
            )
            .cpu()
        )

        self.assertTrue(torch.all(torch.abs(out_gt - out_repro) < consts.eps))

class TestMSAColumnAttention(unittest.TestCase):
    """Tests for the MSAColumnAttention module."""

    def test_shape(self):
        """The output must have the same shape as the input tensor."""
        batch_size = consts.batch_size
        n_seq = consts.n_seq
        n_res = consts.n_res
        c_m = consts.c_m
        c = 44
        no_heads = 4

        msaca = MSAColumnAttention(c_m, c, no_heads)

        x = torch.rand((batch_size, n_seq, n_res, c_m))

        shape_before = x.shape
        x = msaca(x, chunk_size=None)
        shape_after = x.shape

        # assertEqual reports both shapes on failure, unlike assertTrue(a == b).
        self.assertEqual(shape_before, shape_after)

    @compare_utils.skip_unless_alphafold_installed()
    def test_compare(self):
        """Compare the OpenFold module against AlphaFold's on identical inputs.

        Runs AlphaFold's MSAColumnAttention through Haiku with pretrained
        weights, runs the corresponding module of the pretrained OpenFold
        model on the same random inputs, and requires every output element to
        agree to within ``consts.eps``. The OpenFold side is executed with
        ``.cuda()``, so a CUDA device is required.
        """

        def run_msa_col_att(msa_act, msa_mask):
            config = compare_utils.get_alphafold_config()
            c_e = config.model.embeddings_and_evoformer.evoformer
            msa_col = alphafold.model.modules.MSAColumnAttention(
                c_e.msa_column_attention, config.model.global_config
            )
            act = msa_col(msa_act=msa_act, msa_mask=msa_mask)
            return act

        f = hk.transform(run_msa_col_att)

        n_res = consts.n_res
        n_seq = consts.n_seq

        msa_act = np.random.rand(n_seq, n_res, consts.c_m).astype(np.float32)
        # Random 0/1 mask, stored as float32.
        msa_mask = np.random.randint(low=0, high=2, size=(n_seq, n_res)).astype(
            np.float32
        )

        # Fetch pretrained parameters (but only from one block)
        params = compare_utils.fetch_alphafold_module_weights(
            "alphafold/alphafold_iteration/evoformer/evoformer_iteration/"
            + "msa_column_attention"
        )
        # Keep only index 0 along the leading axis of every parameter array.
        params = tree_map(lambda n: n[0], params, jax.numpy.DeviceArray)

        out_gt = f.apply(params, None, msa_act, msa_mask).block_until_ready()
        out_gt = torch.as_tensor(np.array(out_gt))

        model = compare_utils.get_global_pretrained_openfold()
        out_repro = (
            model.evoformer.blocks[0]
            .msa_att_col(
                torch.as_tensor(msa_act).cuda(),
                chunk_size=4,
                mask=torch.as_tensor(msa_mask).cuda(),
            )
            .cpu()
        )

        self.assertTrue(torch.all(torch.abs(out_gt - out_repro) < consts.eps))

class TestMSAColumnGlobalAttention(unittest.TestCase):
    """Tests for the MSAColumnGlobalAttention module."""

    def test_shape(self):
        """The output must have the same shape as the input tensor."""
        batch_size = consts.batch_size
        n_seq = consts.n_seq
        n_res = consts.n_res
        c_m = consts.c_m
        c = 44
        no_heads = 4

        msagca = MSAColumnGlobalAttention(c_m, c, no_heads)

        x = torch.rand((batch_size, n_seq, n_res, c_m))

        shape_before = x.shape
        x = msagca(x, chunk_size=None)
        shape_after = x.shape

        # assertEqual reports both shapes on failure, unlike assertTrue(a == b).
        self.assertEqual(shape_before, shape_after)

    @compare_utils.skip_unless_alphafold_installed()
    def test_compare(self):
        """Compare the OpenFold module against AlphaFold's on identical inputs.

        Runs AlphaFold's MSAColumnGlobalAttention through Haiku with
        pretrained extra-MSA-stack weights, runs the corresponding module of
        the pretrained OpenFold model on the same random inputs, and requires
        every output element to agree to within ``consts.eps``. The OpenFold
        side is executed with ``.cuda()``, so a CUDA device is required.
        """

        def run_msa_col_global_att(msa_act, msa_mask):
            config = compare_utils.get_alphafold_config()
            c_e = config.model.embeddings_and_evoformer.evoformer
            msa_col = alphafold.model.modules.MSAColumnGlobalAttention(
                c_e.msa_column_attention,
                config.model.global_config,
                name="msa_column_global_attention",
            )
            act = msa_col(msa_act=msa_act, msa_mask=msa_mask)
            return act

        f = hk.transform(run_msa_col_global_att)

        n_res = consts.n_res
        n_seq = consts.n_seq
        c_e = consts.c_e

        msa_act = np.random.rand(n_seq, n_res, c_e)
        # Random 0/1 integer mask.
        msa_mask = np.random.randint(low=0, high=2, size=(n_seq, n_res))

        # Fetch pretrained parameters (but only from one block)
        params = compare_utils.fetch_alphafold_module_weights(
            "alphafold/alphafold_iteration/evoformer/extra_msa_stack/"
            + "msa_column_global_attention"
        )
        # Keep only index 0 along the leading axis of every parameter array.
        params = tree_map(lambda n: n[0], params, jax.numpy.DeviceArray)

        out_gt = f.apply(params, None, msa_act, msa_mask).block_until_ready()
        out_gt = torch.as_tensor(np.array(out_gt))

        model = compare_utils.get_global_pretrained_openfold()
        out_repro = (
            model.extra_msa_stack.stack.blocks[0]
            .msa_att_col(
                torch.as_tensor(msa_act, dtype=torch.float32).cuda(),
                chunk_size=4,
                mask=torch.as_tensor(msa_mask, dtype=torch.float32).cuda(),
            )
            .cpu()
        )

        # Every element must be within tolerance. Taking torch.max of the
        # boolean mask instead would pass as soon as a single element matched.
        self.assertTrue(torch.all(torch.abs(out_gt - out_repro) < consts.eps))

# Run every test case in this module when the file is executed as a script.
if __name__ == "__main__":
    unittest.main()