Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
deepspeed
Commits
25d5540b
Commit
25d5540b
authored
Jun 14, 2023
by
aiss
Browse files
add block_thread arg
parent
1c0bde25
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
5 additions
and
3 deletions
+5
-3
op_builder/fused_adam.py
op_builder/fused_adam.py
+2
-1
op_builder/fused_lamb.py
op_builder/fused_lamb.py
+2
-1
run.sh
run.sh
+1
-1
No files found.
op_builder/fused_adam.py
View file @
25d5540b
...
...
@@ -29,7 +29,8 @@ class FusedAdamBuilder(CUDAOpBuilder):
return
args
+
self
.
version_dependent_macros
()
def
nvcc_args
(
self
):
nvcc_flags
=
[
'-O3'
]
+
self
.
version_dependent_macros
()
nvcc_flags
=
super
().
nvcc_args
()
nvcc_flags
+=
[
'-O3'
]
+
self
.
version_dependent_macros
()
if
not
self
.
is_rocm_pytorch
():
nvcc_flags
.
extend
(
[
'-allow-unsupported-compiler'
if
sys
.
platform
==
"win32"
else
''
,
'-lineinfo'
,
'--use_fast_math'
]
+
...
...
op_builder/fused_lamb.py
View file @
25d5540b
...
...
@@ -29,7 +29,8 @@ class FusedLambBuilder(CUDAOpBuilder):
return
args
+
self
.
version_dependent_macros
()
def
nvcc_args
(
self
):
nvcc_flags
=
[
'-O3'
]
+
self
.
version_dependent_macros
()
nvcc_flags
=
super
().
nvcc_args
()
nvcc_flags
+=
[
'-O3'
]
+
self
.
version_dependent_macros
()
if
self
.
is_rocm_pytorch
():
ROCM_MAJOR
,
ROCM_MINOR
=
self
.
installed_rocm_version
()
nvcc_flags
+=
[
'-DROCM_VERSION_MAJOR=%s'
%
ROCM_MAJOR
,
'-DROCM_VERSION_MINOR=%s'
%
ROCM_MINOR
]
...
...
run.sh
View file @
25d5540b
...
...
@@ -2,4 +2,4 @@
export
LIBRARY_PATH
=
/usr/local/lib:
$LIBRARY_PATH
#export DS_BUILD_VERSION=dtk22.10.1
export
LD_LIBRARY_PATH
=
/usr/local/lib/python3.7/site-packages/torch/lib:
$LD_LIBRARY_PATH
DS_BUILD_STRING
=
.dtk22.10.1.torch1.10
DS_BUILD_RANDOM_LTD
=
0
DS_BUILD_QUANTIZER
=
0
DS_BUILD_TRANSFORMER_INFERENCE
=
0
DS_BUILD_OPS
=
1
verbose
=
1
CXX
=
hipcc
CC
=
hipcc python3 setup.py
install
bdist_wheel
DS_BUILD_RANDOM_LTD
=
0
DS_BUILD_QUANTIZER
=
0
DS_BUILD_TRANSFORMER_INFERENCE
=
0
DS_BUILD_OPS
=
1
verbose
=
1
CXX
=
hipcc
CC
=
hipcc python3 setup.py
install
bdist_wheel
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment