Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
OpenFold
Commits
81ae777d
Commit
81ae777d
authored
Oct 26, 2021
by
Gustaf Ahdritz
Browse files
Make template parsing optional
parent
ea484b71
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
33 additions
and
22 deletions
+33
-22
openfold/data/data_pipeline.py
openfold/data/data_pipeline.py
+33
-22
No files found.
openfold/data/data_pipeline.py
View file @
81ae777d
...
...
@@ -339,12 +339,16 @@ class DataPipeline:
hits
=
self
.
_parse_template_hits
(
alignment_dir
)
hits_cat
=
sum
(
hits
.
values
(),
[])
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
None
,
hits
=
hits_cat
,
)
if
(
len
(
hits_cat
)
==
0
):
template_features
=
{}
else
:
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
None
,
hits
=
hits_cat
,
)
template_features
=
templates_result
.
features
sequence_features
=
make_sequence_features
(
sequence
=
input_sequence
,
...
...
@@ -357,7 +361,7 @@ class DataPipeline:
return
{
**
sequence_features
,
**
msa_features
,
**
template
s_result
.
features
**
template
_
features
}
def
process_mmcif
(
...
...
@@ -384,17 +388,20 @@ class DataPipeline:
input_sequence
=
mmcif
.
chain_to_seqres
[
chain_id
]
hits
=
self
.
_parse_template_hits
(
alignment_dir
)
hits_cat
=
sum
(
hits
.
values
(),
[])
print
(
len
(
hits_cat
))
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
to_date
(
mmcif
.
header
[
"release_date"
]),
hits
=
hits_cat
,
)
if
(
len
(
hits_cat
)
==
0
):
template_features
=
{}
else
:
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
to_date
(
mmcif
.
header
[
"release_date"
]),
hits
=
hits_cat
,
)
template_features
=
templates_result
.
features
msa_features
=
self
.
_process_msa_feats
(
alignment_dir
)
return
{
**
mmcif_feats
,
**
template
s_result
.
features
,
**
msa_features
}
return
{
**
mmcif_feats
,
**
template
_
features
,
**
msa_features
}
def
process_pdb
(
self
,
...
...
@@ -413,13 +420,17 @@ class DataPipeline:
hits
=
self
.
_parse_template_hits
(
alignment_dir
)
hits_cat
=
sum
(
hits
.
values
(),
[])
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
None
,
hits
=
hits_cat
,
)
if
(
len
(
hits_cat
)
==
0
):
template_features
=
{}
else
:
templates_result
=
self
.
template_featurizer
.
get_templates
(
query_sequence
=
input_sequence
,
query_pdb_code
=
None
,
query_release_date
=
None
,
hits
=
hits_cat
,
)
template_features
=
templates_result
.
features
msa_features
=
self
.
_process_msa_feats
(
alignment_dir
)
return
{
**
pdb_feats
,
**
template
s_result
.
features
,
**
msa_features
}
return
{
**
pdb_feats
,
**
template
_
features
,
**
msa_features
}
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment