Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
OpenFold
Commits
294c04ad
"git@developer.sourcefind.cn:OpenDAS/sparseconvnet.git" did not exist on "159e5f9a2349c776c422dce9f5b4493519303dc2"
Commit
294c04ad
authored
Jun 23, 2022
by
Brian Loyal
Browse files
Updated code to and fix bad fasta inputs
parent
7cf3125e
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
9 additions
and
11 deletions
+9
-11
run_pretrained_openfold.py
run_pretrained_openfold.py
+9
-11
No files found.
run_pretrained_openfold.py
View file @
294c04ad
...
@@ -29,6 +29,7 @@ import random
...
@@ -29,6 +29,7 @@ import random
import
sys
import
sys
import
time
import
time
import
torch
import
torch
import
re
from
openfold.config
import
model_config
from
openfold.config
import
model_config
from
openfold.data
import
templates
,
feature_pipeline
,
data_pipeline
from
openfold.data
import
templates
,
feature_pipeline
,
data_pipeline
...
@@ -163,6 +164,7 @@ def prep_output(out, batch, feature_dict, feature_processor, args):
...
@@ -163,6 +164,7 @@ def prep_output(out, batch, feature_dict, feature_processor, args):
def
parse_fasta
(
data
):
def
parse_fasta
(
data
):
data
=
re
.
sub
(
'>$'
,
''
,
data
,
flags
=
re
.
M
)
lines
=
[
lines
=
[
l
.
replace
(
'
\n
'
,
''
)
l
.
replace
(
'
\n
'
,
''
)
for
prot
in
data
.
split
(
'>'
)
for
l
in
prot
.
strip
().
split
(
'
\n
'
,
1
)
for
prot
in
data
.
split
(
'>'
)
for
l
in
prot
.
strip
().
split
(
'
\n
'
,
1
)
...
@@ -272,6 +274,8 @@ def load_models_from_command_line(args, config):
...
@@ -272,6 +274,8 @@ def load_models_from_command_line(args, config):
"be specified."
"be specified."
)
)
def
list_files_with_extensions
(
dir
,
extensions
):
return
[
f
for
f
in
os
.
listdir
(
dir
)
if
f
.
endswith
(
extensions
)]
def
main
(
args
):
def
main
(
args
):
# Create the output directory
# Create the output directory
...
@@ -307,19 +311,13 @@ def main(args):
...
@@ -307,19 +311,13 @@ def main(args):
prediction_dir
=
os
.
path
.
join
(
args
.
output_dir
,
"predictions"
)
prediction_dir
=
os
.
path
.
join
(
args
.
output_dir
,
"predictions"
)
os
.
makedirs
(
prediction_dir
,
exist_ok
=
True
)
os
.
makedirs
(
prediction_dir
,
exist_ok
=
True
)
for
fasta_file
in
[
f
for
f
in
os
.
listdir
(
args
.
fasta_dir
)
if
os
.
path
.
splitext
(
f
)[
1
]
in
[
".fasta"
,
".fa"
]]
:
for
fasta_file
in
list_files_with_extensions
(
args
.
fasta_dir
,
(
".fasta"
,
".fa"
))
:
# Gather input sequences
# Gather input sequences
with
open
(
os
.
path
.
join
(
args
.
fasta_dir
,
fasta_file
),
"r"
)
as
fp
:
with
open
(
os
.
path
.
join
(
args
.
fasta_dir
,
fasta_file
),
"r"
)
as
fp
:
data
=
fp
.
read
()
data
=
fp
.
read
()
tags
=
[]
tags
,
seqs
=
parse_fasta
(
data
)
seqs
=
[]
# assert len(tags) == len(set(tags)), "All FASTA tags must be unique"
for
prot
in
data
.
split
(
">"
)[
1
::]:
lines
=
prot
.
strip
().
split
(
"
\n
"
)
tags
.
append
(
lines
[
0
].
strip
().
split
()[
0
])
seqs
.
append
(
""
.
join
(
lines
[
1
:]))
assert
len
(
tags
)
==
len
(
set
(
tags
)),
"All FASTA tags must be unique"
tag
=
'-'
.
join
(
tags
)
tag
=
'-'
.
join
(
tags
)
output_name
=
f
'
{
tag
}
_
{
args
.
config_preset
}
'
output_name
=
f
'
{
tag
}
_
{
args
.
config_preset
}
'
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment