Unverified commit 5682e6d3, authored by Jiarui Fang, committed by GitHub
Browse files

[hotfix] correct cpu_optim runtime compilation (#2197)

parent 6642cebd
...@@ -48,7 +48,7 @@ class CPUAdamBuilder(Builder): ...@@ -48,7 +48,7 @@ class CPUAdamBuilder(Builder):
sources=[os.path.join('colossalai/kernel/cuda_native/csrc', path) for path in self.sources], sources=[os.path.join('colossalai/kernel/cuda_native/csrc', path) for path in self.sources],
include_dirs=self.extra_include_paths, include_dirs=self.extra_include_paths,
extra_compile_args={ extra_compile_args={
'cxx': ['-O3'] + self.version_dependent_macros + self.extra_cuda_flags, 'cxx': ['-O3'] + self.version_dependent_macros + self.extra_cxx_flags,
'nvcc': 'nvcc':
append_nvcc_threads(['-O3', '--use_fast_math'] + self.version_dependent_macros + append_nvcc_threads(['-O3', '--use_fast_math'] + self.version_dependent_macros +
self.extra_cuda_flags) self.extra_cuda_flags)
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment