Commit da80a2e3 authored by guangzlu
Browse files

changed fwd instance parameters

parent 88980945
......@@ -105,9 +105,9 @@ using DeviceGemmInstance =
256,
128, // MPerBlock
128, // NPerBlock
64, // KPerBlock
32, // KPerBlock
64, // Gemm1NPerBlock
64, // Gemm1KPerBlock
32, // Gemm1KPerBlock
8, // AK1
8, // BK1
2, // B1K1
......@@ -130,11 +130,11 @@ using DeviceGemmInstance =
8,
8,
true,
S<8, 32, 1>, // B1BlockTransfer
S<16, 16, 1>, // B1BlockTransfer
S<0, 2, 1>,
S<0, 2, 1>,
1,
2,
4,
2,
false,
1, // CShuffleMXdlPerWavePerShuffle
......
......@@ -101,9 +101,9 @@ using DeviceGemmInstance =
256,
128, // MPerBlock
128, // NPerBlock
64, // KPerBlock
32, // KPerBlock
64, // Gemm1NPerBlock
64, // Gemm1KPerBlock
32, // Gemm1KPerBlock
8, // AK1
8, // BK1
2, // B1K1
......@@ -130,7 +130,7 @@ using DeviceGemmInstance =
S<0, 2, 1>,
S<0, 2, 1>,
1,
2,
4,
2,
false,
1, // CShuffleMXdlPerWavePerShuffle
......
......@@ -105,9 +105,9 @@ using DeviceGemmInstance =
256,
128, // MPerBlock
128, // NPerBlock
64, // KPerBlock
32, // KPerBlock
64, // Gemm1NPerBlock
64, // Gemm1KPerBlock
32, // Gemm1KPerBlock
8, // AK1
8, // BK1
2, // B1K1
......@@ -130,11 +130,11 @@ using DeviceGemmInstance =
8,
8,
true,
S<8, 32, 1>, // B1BlockTransfer
S<16, 16, 1>, // B1BlockTransfer
S<0, 2, 1>,
S<0, 2, 1>,
1,
2,
4,
2,
false,
1, // CShuffleMXdlPerWavePerShuffle
......
......@@ -101,9 +101,9 @@ using DeviceGemmInstance =
256,
128, // MPerBlock
128, // NPerBlock
64, // KPerBlock
32, // KPerBlock
64, // Gemm1NPerBlock
64, // Gemm1KPerBlock
32, // Gemm1KPerBlock
8, // AK1
8, // BK1
2, // B1K1
......@@ -130,7 +130,7 @@ using DeviceGemmInstance =
S<0, 2, 1>,
S<0, 2, 1>,
1,
2,
4,
2,
false,
1, // CShuffleMXdlPerWavePerShuffle
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment