Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
deepspeed
Commits
eea1c285
"src/vscode:/vscode.git/clone" did not exist on "23e091564fbfea1d3b56b5e293f4244367f65a8f"
Unverified
Commit
eea1c285
authored
Nov 11, 2020
by
Jeff Rasley
Committed by
GitHub
Nov 11, 2020
Browse files
fix bug on non-DLTS infra when no output path set (#523)
parent
be1147c0
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
10 additions
and
3 deletions
+10
-3
deepspeed/runtime/engine.py
deepspeed/runtime/engine.py
+10
-3
No files found.
deepspeed/runtime/engine.py
View file @
eea1c285
...
...
@@ -38,7 +38,6 @@ from deepspeed.runtime.progressive_layer_drop import ProgressiveLayerDrop
from
.utils
import
ensure_directory_exists
MEMORY_OPT_ALLREDUCE_SIZE
=
500000000
SUMMARY_WRITER_DIR_NAME
=
"JobId"
try
:
from
apex_C
import
flatten
...
...
@@ -271,9 +270,17 @@ class DeepSpeedEngine(Module):
else
:
if
self
.
tensorboard_job_name
():
name
=
self
.
tensorboard_job_name
()
# Infrastructure-specific job-id
if
'DLWS_JOB_ID'
in
os
.
environ
:
SUMMARY_WRITER_DIR_NAME
=
os
.
path
.
join
(
os
.
environ
[
'DLWS_JOB_ID'
],
"logs"
)
log_dir
=
os
.
path
.
join
(
base
,
SUMMARY_WRITER_DIR_NAME
,
name
)
infra_job_id
=
os
.
environ
[
'DLWS_JOB_ID'
]
elif
'DLTS_JOB_ID'
in
os
.
environ
:
infra_job_id
=
os
.
environ
[
'DLTS_JOB_ID'
]
else
:
infra_job_id
=
'unknown-job-id'
summary_writer_dir_name
=
os
.
path
.
join
(
infra_job_id
,
"logs"
)
log_dir
=
os
.
path
.
join
(
base
,
summary_writer_dir_name
,
name
)
os
.
makedirs
(
log_dir
,
exist_ok
=
True
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment