Commit 19d090cb authored by Sachin Kadyan
Browse files

Added switch in inference flow for using sequence embedding instead of MSAs.

- Added a `seqemb_mode` bool flag to `data_pipeline > process_fasta()`
- When `seqemb_mode` is enabled, use dummy MSA features instead of the full ones.
parent e40900d8
...@@ -643,6 +643,7 @@ class DataPipeline: ...@@ -643,6 +643,7 @@ class DataPipeline:
fasta_path: str, fasta_path: str,
alignment_dir: str, alignment_dir: str,
alignment_index: Optional[str] = None, alignment_index: Optional[str] = None,
seqemb_mode: bool = False,
) -> FeatureDict: ) -> FeatureDict:
"""Assembles features for a single sequence in a FASTA file""" """Assembles features for a single sequence in a FASTA file"""
with open(fasta_path) as f: with open(fasta_path) as f:
...@@ -668,8 +669,10 @@ class DataPipeline: ...@@ -668,8 +669,10 @@ class DataPipeline:
description=input_description, description=input_description,
num_res=num_res, num_res=num_res,
) )
if seqemb_mode:
msa_features = self._process_msa_feats(alignment_dir, input_sequence, alignment_index) msa_features = make_dummy_msa_feats(input_sequence)
else:
msa_features = self._process_msa_feats(alignment_dir, input_sequence, alignment_index)
return { return {
**sequence_features, **sequence_features,
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment