Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
8a34c508
Unverified
Commit
8a34c508
Authored Apr 09, 2026 by Andrew Barnes
Committed by GitHub on Apr 09, 2026
Browse files
[ROCm] Remove unnecessary fp8 roundtrip in gather cache NHD dequant (#39122)
Signed-off-by: Bortlesboat <bortstheboat@gmail.com>
parent
ed2f282b
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing 1 changed file with 6 additions and 4 deletions
+6
-4
vllm/v1/attention/backends/rocm_aiter_fa.py
vllm/v1/attention/backends/rocm_aiter_fa.py
+6
-4
No files found.
vllm/v1/attention/backends/rocm_aiter_fa.py
View file @
8a34c508
...
@@ -112,10 +112,12 @@ if current_platform.is_rocm():
...
@@ -112,10 +112,12 @@ if current_platform.is_rocm():
if
DEQUANT
:
if
DEQUANT
:
k_scale
=
tl
.
load
(
k_scale_ptr
)
k_scale
=
tl
.
load
(
k_scale_ptr
)
v_scale
=
tl
.
load
(
v_scale_ptr
)
v_scale
=
tl
.
load
(
v_scale_ptr
)
k_dtype
=
k_reg
.
dtype
k_reg
=
(
k_reg
.
to
(
tl
.
float32
)
*
k_scale
).
to
(
v_dtype
=
v_reg
.
dtype
key_ptr_offset
.
dtype
.
element_ty
k_reg
=
(
k_reg
.
to
(
tl
.
float32
)
*
k_scale
).
to
(
k_dtype
)
)
v_reg
=
(
v_reg
.
to
(
tl
.
float32
)
*
v_scale
).
to
(
v_dtype
)
v_reg
=
(
v_reg
.
to
(
tl
.
float32
)
*
v_scale
).
to
(
value_ptr_offset
.
dtype
.
element_ty
)
tl
.
store
(
key_ptr_offset
+
col_offsets
,
k_reg
)
tl
.
store
(
key_ptr_offset
+
col_offsets
,
k_reg
)
tl
.
store
(
value_ptr_offset
+
col_offsets
,
v_reg
)
tl
.
store
(
value_ptr_offset
+
col_offsets
,
v_reg
)
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please register or sign in to comment.