Unverified commit d88594a3, authored by Lei Wang and committed by GitHub
Browse files

[Debug] Always include line info in NVCC command for improved profiling and mapping (#1364)

parent f951b924
...@@ -80,8 +80,8 @@ def compile_cuda(code, ...@@ -80,8 +80,8 @@ def compile_cuda(code,
file_target = path_target if path_target else temp_target file_target = path_target if path_target else temp_target
cmd = [get_nvcc_compiler()] cmd = [get_nvcc_compiler()]
cmd += [f"--{target_format}", "-O3"] cmd += [f"--{target_format}", "-O3"]
if kernels_output_dir is not None: # Always include line info for better profiling and mapping
cmd += ["-lineinfo"] cmd += ["-lineinfo"]
if isinstance(arch, list): if isinstance(arch, list):
cmd += arch cmd += arch
elif isinstance(arch, str): elif isinstance(arch, str):
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment