defines.h 622 Bytes
Newer Older
1
2
3
#pragma once

#include <cutlass/bfloat16.h>
zhanghj2's avatar
zhanghj2 committed
4
// #include <cutlass/arch/barrier.h>
5
6

// Short project-wide alias for CUTLASS's bfloat16 element type
// (declared in <cutlass/bfloat16.h>, included above).
using bf16 = cutlass::bfloat16_t;
zhanghj2's avatar
zhanghj2 committed
7
// One-byte storage alias, presumably holding the raw bit pattern of an 8-bit
// floating-point value. It is a plain `unsigned char`, so any arithmetic or
// comparison applied directly to an `fp8` is integer arithmetic on the byte,
// not floating-point math.
// NOTE(review): the FP8 encoding (e.g. E4M3 vs. E5M2) is not specified in this
// header — confirm against the code that produces/consumes these values.
using fp8 = unsigned char;
zhanghj2's avatar
zhanghj2 committed
8
9
10
11
// using transac_bar_t = cutlass::arch::ClusterTransactionBarrier;
// using cutlass::arch::fence_view_async_shared;
// using cutlass::arch::fence_barrier_init;
// using cutlass::arch::NamedBarrier;
12

zhanghj2's avatar
zhanghj2 committed
13
14
15
// struct int32x8_t {
//     int a0, a1, a2, a3, a4, a5, a6, a7;
// };
16

zhanghj2's avatar
zhanghj2 committed
17
18
19
// struct float8 {
//     // float2 a01, a23, a45, a67;
// };
20

zhanghj2's avatar
zhanghj2 committed
21
22
23
24
25
26
// struct bf16x8 {
//     // __nv_bfloat162 a01;
//     // __nv_bfloat162 a23;
//     // __nv_bfloat162 a45;
//     // __nv_bfloat162 a67;
// };