Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
tilelang
Commits
556e87bf
Unverified
Commit
556e87bf
authored
Nov 07, 2025
by
LJC00118
Committed by
GitHub
Nov 07, 2025
Browse files
fix data type (#1204)
parent
0592834f
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
2 additions
and
2 deletions
+2
-2
src/tl_templates/cuda/reduce.h
src/tl_templates/cuda/reduce.h
+2
-2
No files found.
src/tl_templates/cuda/reduce.h
View file @
556e87bf
...
...
@@ -73,7 +73,7 @@ struct SharedReduceWarp {
unsigned
mask
=
__activemask
();
for
(
int
offset
=
kWarpSize
/
2
;
offset
>
0
;
offset
>>=
1
)
{
T
other
=
__
shfl_down_sync
(
mask
,
partial
,
offset
);
T
other
=
tl
::
shfl_down_sync
(
mask
,
partial
,
offset
);
partial
=
Reducer
()(
partial
,
other
);
}
...
...
@@ -159,7 +159,7 @@ template <int threads, bool reverse = false> struct CumSum1D {
#pragma unroll
for
(
int
off
=
1
;
off
<
SEG
;
off
<<=
1
)
{
T
n
=
(
T
)
__
shfl_down_sync
(
MASK
,
val
,
off
);
T
n
=
(
T
)
tl
::
shfl_down_sync
(
MASK
,
val
,
off
);
if
(
lane
<
SEG
-
off
)
val
+=
n
;
}
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment