Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
1197e021
Unverified
Commit
1197e021
authored
May 31, 2024
by
Tyler Michael Smith
Committed by
GitHub
May 31, 2024
Browse files
[Build] Guard against older CUDA versions when building CUTLASS 3.x kernels (#5168)
parent
65757911
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
18 additions
and
3 deletions
+18
-3
csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu
csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu
+8
-2
csrc/quantization/cutlass_w8a8/scaled_mm_dq_entry.cu
csrc/quantization/cutlass_w8a8/scaled_mm_dq_entry.cu
+10
-1
No files found.
csrc/quantization/cutlass_w8a8/scaled_mm_dq_c3x.cu
View file @
1197e021
// clang-format will break include orders
// clang-format off
#include <cudaTypedefs.h>
#if defined CUDA_VERSION && CUDA_VERSION >= 12000
#include <torch/extension.h>
#include <torch/extension.h>
#include <ATen/cuda/CUDAContext.h>
#include <ATen/cuda/CUDAContext.h>
...
@@ -6,8 +12,6 @@
...
@@ -6,8 +12,6 @@
#include <sstream>
#include <sstream>
#include <vector>
#include <vector>
// clang-format will break include orders
// clang-format off
#include "cutlass/cutlass.h"
#include "cutlass/cutlass.h"
#include "cute/tensor.hpp"
#include "cute/tensor.hpp"
...
@@ -241,3 +245,5 @@ void cutlass_scaled_mm_dq_sm90(torch::Tensor& out, torch::Tensor const& a,
...
@@ -241,3 +245,5 @@ void cutlass_scaled_mm_dq_sm90(torch::Tensor& out, torch::Tensor const& a,
}
}
}
}
}
}
#endif
csrc/quantization/cutlass_w8a8/scaled_mm_dq_entry.cu
View file @
1197e021
#include <cudaTypedefs.h>
#include <c10/cuda/CUDAGuard.h>
#include <c10/cuda/CUDAGuard.h>
#include <cuda_runtime.h>
#include <torch/extension.h>
#include <torch/extension.h>
void
cutlass_scaled_mm_dq_sm75
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
void
cutlass_scaled_mm_dq_sm75
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
...
@@ -17,10 +18,12 @@ void cutlass_scaled_mm_dq_sm89(torch::Tensor& c, torch::Tensor const& a,
...
@@ -17,10 +18,12 @@ void cutlass_scaled_mm_dq_sm89(torch::Tensor& c, torch::Tensor const& a,
torch
::
Tensor
const
&
a_scales
,
torch
::
Tensor
const
&
a_scales
,
torch
::
Tensor
const
&
b_scales
);
torch
::
Tensor
const
&
b_scales
);
#if defined CUDA_VERSION && CUDA_VERSION >= 12000
void
cutlass_scaled_mm_dq_sm90
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
void
cutlass_scaled_mm_dq_sm90
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
torch
::
Tensor
const
&
b
,
torch
::
Tensor
const
&
b
,
torch
::
Tensor
const
&
a_scales
,
torch
::
Tensor
const
&
a_scales
,
torch
::
Tensor
const
&
b_scales
);
torch
::
Tensor
const
&
b_scales
);
#endif
void
cutlass_scaled_mm_dq
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
void
cutlass_scaled_mm_dq
(
torch
::
Tensor
&
c
,
torch
::
Tensor
const
&
a
,
torch
::
Tensor
const
&
b
,
torch
::
Tensor
const
&
a_scales
,
torch
::
Tensor
const
&
b
,
torch
::
Tensor
const
&
a_scales
,
...
@@ -51,7 +54,13 @@ void cutlass_scaled_mm_dq(torch::Tensor& c, torch::Tensor const& a,
...
@@ -51,7 +54,13 @@ void cutlass_scaled_mm_dq(torch::Tensor& c, torch::Tensor const& a,
if
(
version_num
>=
90
)
{
if
(
version_num
>=
90
)
{
// Hopper
// Hopper
// Guard against compilation issues for sm90 kernels
#if defined CUDA_VERSION && CUDA_VERSION >= 12000
cutlass_scaled_mm_dq_sm90
(
c
,
a
,
b
,
a_scales
,
b_scales
);
cutlass_scaled_mm_dq_sm90
(
c
,
a
,
b
,
a_scales
,
b_scales
);
#else
cutlass_scaled_mm_dq_sm80
(
c
,
a
,
b
,
a_scales
,
b_scales
);
#endif
}
else
if
(
version_num
==
89
)
{
}
else
if
(
version_num
==
89
)
{
// Ada Lovelace
// Ada Lovelace
cutlass_scaled_mm_dq_sm89
(
c
,
a
,
b
,
a_scales
,
b_scales
);
cutlass_scaled_mm_dq_sm89
(
c
,
a
,
b
,
a_scales
,
b_scales
);
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment