Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
gaoqiong
composable_kernel
Commits
da80a2e3
Commit
da80a2e3
authored
Mar 06, 2023
by
guangzlu
Browse files
changed fwd instance parameters
parent
88980945
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
14 additions
and
14 deletions
+14
-14
example/32_batched_gemm_scale_softmax_gemm/batched_multihead_attention_forward.cpp
...cale_softmax_gemm/batched_multihead_attention_forward.cpp
+4
-4
example/32_batched_gemm_scale_softmax_gemm/batched_multihead_attention_forward_bf16.cpp
...softmax_gemm/batched_multihead_attention_forward_bf16.cpp
+3
-3
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_forward.cpp
...cale_softmax_gemm/grouped_multihead_attention_forward.cpp
+4
-4
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_forward_bf16.cpp
...softmax_gemm/grouped_multihead_attention_forward_bf16.cpp
+3
-3
No files found.
example/32_batched_gemm_scale_softmax_gemm/batched_multihead_attention_forward.cpp
View file @
da80a2e3
...
...
@@ -105,9 +105,9 @@ using DeviceGemmInstance =
256
,
128
,
// MPerBlock
128
,
// NPerBlock
64
,
// KPerBlock
32
,
// KPerBlock
64
,
// Gemm1NPerBlock
64
,
// Gemm1KPerBlock
32
,
// Gemm1KPerBlock
8
,
// AK1
8
,
// BK1
2
,
// B1K1
...
...
@@ -130,11 +130,11 @@ using DeviceGemmInstance =
8
,
8
,
true
,
S
<
8
,
32
,
1
>
,
// B1BlockTransfer
S
<
16
,
16
,
1
>
,
// B1BlockTransfer
S
<
0
,
2
,
1
>
,
S
<
0
,
2
,
1
>
,
1
,
2
,
4
,
2
,
false
,
1
,
// CShuffleMXdlPerWavePerShuffle
...
...
example/32_batched_gemm_scale_softmax_gemm/batched_multihead_attention_forward_bf16.cpp
View file @
da80a2e3
...
...
@@ -101,9 +101,9 @@ using DeviceGemmInstance =
256
,
128
,
// MPerBlock
128
,
// NPerBlock
64
,
// KPerBlock
32
,
// KPerBlock
64
,
// Gemm1NPerBlock
64
,
// Gemm1KPerBlock
32
,
// Gemm1KPerBlock
8
,
// AK1
8
,
// BK1
2
,
// B1K1
...
...
@@ -130,7 +130,7 @@ using DeviceGemmInstance =
S
<
0
,
2
,
1
>
,
S
<
0
,
2
,
1
>
,
1
,
2
,
4
,
2
,
false
,
1
,
// CShuffleMXdlPerWavePerShuffle
...
...
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_forward.cpp
View file @
da80a2e3
...
...
@@ -105,9 +105,9 @@ using DeviceGemmInstance =
256
,
128
,
// MPerBlock
128
,
// NPerBlock
64
,
// KPerBlock
32
,
// KPerBlock
64
,
// Gemm1NPerBlock
64
,
// Gemm1KPerBlock
32
,
// Gemm1KPerBlock
8
,
// AK1
8
,
// BK1
2
,
// B1K1
...
...
@@ -130,11 +130,11 @@ using DeviceGemmInstance =
8
,
8
,
true
,
S
<
8
,
32
,
1
>
,
// B1BlockTransfer
S
<
16
,
16
,
1
>
,
// B1BlockTransfer
S
<
0
,
2
,
1
>
,
S
<
0
,
2
,
1
>
,
1
,
2
,
4
,
2
,
false
,
1
,
// CShuffleMXdlPerWavePerShuffle
...
...
example/32_batched_gemm_scale_softmax_gemm/grouped_multihead_attention_forward_bf16.cpp
View file @
da80a2e3
...
...
@@ -101,9 +101,9 @@ using DeviceGemmInstance =
256
,
128
,
// MPerBlock
128
,
// NPerBlock
64
,
// KPerBlock
32
,
// KPerBlock
64
,
// Gemm1NPerBlock
64
,
// Gemm1KPerBlock
32
,
// Gemm1KPerBlock
8
,
// AK1
8
,
// BK1
2
,
// B1K1
...
...
@@ -130,7 +130,7 @@ using DeviceGemmInstance =
S
<
0
,
2
,
1
>
,
S
<
0
,
2
,
1
>
,
1
,
2
,
4
,
2
,
false
,
1
,
// CShuffleMXdlPerWavePerShuffle
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment