Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
flash-attention
Commits
d732be1e
Commit
d732be1e
authored
May 26, 2024
by
Tri Dao
Browse files
Update to Cutlass 3.5
parent
af627063
Changes
7
Show whitespace changes
Inline
Side-by-side
Showing
7 changed files
with
7 additions
and
8 deletions
+7
-8
csrc/cutlass
csrc/cutlass
+1
-1
csrc/flash_attn/src/flash_bwd_kernel.h
csrc/flash_attn/src/flash_bwd_kernel.h
+1
-1
csrc/flash_attn/src/flash_bwd_preprocess_kernel.h
csrc/flash_attn/src/flash_bwd_preprocess_kernel.h
+1
-1
csrc/flash_attn/src/flash_fwd_kernel.h
csrc/flash_attn/src/flash_fwd_kernel.h
+1
-1
csrc/flash_attn/src/kernel_traits.h
csrc/flash_attn/src/kernel_traits.h
+1
-1
csrc/flash_attn/src/rotary.h
csrc/flash_attn/src/rotary.h
+1
-1
csrc/flash_attn/src/utils.h
csrc/flash_attn/src/utils.h
+1
-2
No files found.
cutlass
@
7d49e6c7
Compare
bbe579a9
...
7d49e6c7
Subproject commit
bbe579a9e3beb6ea6626d9227ec32d0dae119a49
Subproject commit
7d49e6c7e2f8896c47f586706e67e1fb215529dc
csrc/flash_attn/src/flash_bwd_kernel.h
View file @
d732be1e
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#pragma once
#pragma once
#include <cute/algorithm/copy.hpp>
#include <cute/tensor.hpp>
#include <cutlass/cutlass.h>
#include <cutlass/cutlass.h>
#include <cutlass/array.h>
#include <cutlass/array.h>
...
...
csrc/flash_attn/src/flash_bwd_preprocess_kernel.h
View file @
d732be1e
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#pragma once
#pragma once
#include <cute/algorithm/copy.hpp>
#include <cute/tensor.hpp>
#include <cutlass/cutlass.h>
#include <cutlass/cutlass.h>
#include <cutlass/array.h>
#include <cutlass/array.h>
...
...
csrc/flash_attn/src/flash_fwd_kernel.h
View file @
d732be1e
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#pragma once
#pragma once
#include <cute/algorithm/copy.hpp>
#include <cute/tensor.hpp>
#include <cutlass/cutlass.h>
#include <cutlass/cutlass.h>
#include <cutlass/array.h>
#include <cutlass/array.h>
...
...
csrc/flash_attn/src/kernel_traits.h
View file @
d732be1e
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#pragma once
#pragma once
#include "cute/algorithm/copy.hpp"
#include "cute/tensor.hpp"
#include "cutlass/cutlass.h"
#include "cutlass/cutlass.h"
#include "cutlass/layout/layout.h"
#include "cutlass/layout/layout.h"
...
...
csrc/flash_attn/src/rotary.h
View file @
d732be1e
...
@@ -4,7 +4,7 @@
...
@@ -4,7 +4,7 @@
#pragma once
#pragma once
#include <cute/algorithm/copy.hpp>
#include <cute/tensor.hpp>
#include "utils.h"
#include "utils.h"
...
...
csrc/flash_attn/src/utils.h
View file @
d732be1e
...
@@ -14,8 +14,7 @@
...
@@ -14,8 +14,7 @@
#include <cuda_bf16.h>
#include <cuda_bf16.h>
#endif
#endif
#include <cute/algorithm/copy.hpp>
#include <cute/tensor.hpp>
#include <cute/algorithm/gemm.hpp>
#include <cutlass/array.h>
#include <cutlass/array.h>
#include <cutlass/cutlass.h>
#include <cutlass/cutlass.h>
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment