// permute_NxHxW_fp16.cpp
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.

#include "common.hpp"

6
7
// Element types supplied as the InData / OutData type arguments of
// DevicePermuteInstance below. F16 is not declared in this file --
// presumably it comes from "common.hpp" (TODO confirm).
using InDataType  = F16;
using OutDataType = F16;
8
9
10

// clang-format off
// Concrete DevicePermute instantiation used by this example: 3 dimensions,
// InDataType -> OutDataType, with PassThrough as the elementwise operation.
// The table below labels each template argument column by column; formatting
// is disabled so the hand-aligned columns survive clang-format.
using DevicePermuteInstance = ck::tensor_operation::device::DevicePermute
// ######|     InData|     OutData| Elementwise| NumDim| Block|  NPer|  HPer|  WPer|   InBlock|      InBlockTransfer|           InBlockTransfer|       Src|       Dst|             Src|             Dst|
// ######|       Type|        Type|   Operation|       |  Size| Block| Block| Block| LdsExtraW| ThreadClusterLengths| ThreadClusterArrangeOrder| VectorDim| VectorDim| ScalarPerVector| ScalarPerVector|
// ######|           |            |            |       |      |      |      |      |          |                     |                          |          |          |                |                |
// ######|           |            |            |       |      |      |      |      |          |                     |                          |          |          |                |                |
         < InDataType, OutDataType, PassThrough,      3,   128,     4,    16,     8,         6,          S<2, 16, 4>,                S<0, 1, 2>,         2,         1,               2,               1>;
// clang-format on

Po-Yen, Chen's avatar
Po-Yen, Chen committed
18
#include "run_permute_element_example.inc"
19

Po-Yen, Chen's avatar
Po-Yen, Chen committed
20
// Entry point: runs the permute example once and maps its result to a process
// exit status -- 0 when run_permute_element_example() yields a truthy value,
// 1 otherwise.
int main()
{
    // First argument: presumably the input tensor lengths (N, H, W per the file
    // name); second: presumably the axis order of the output -- confirm against
    // run_permute_element_example.inc.
    const bool failed = !run_permute_element_example({121, 768, 80}, {0, 2, 1});

    return failed ? 1 : 0;
}