"examples/vscode:/vscode.git/clone" did not exist on "3ddc2b73957a0d2172664ce9551c4fd5c9b8380c"
Commit 82cc8731 authored by Po-Yen, Chen
Browse files

Add new example 'example_permute_NxHxW_fp32'

parent 01ca856c
# Umbrella target for the permute examples; it has no commands of its own and
# exists so the example executables below can be attached to it as dependencies.
add_custom_target(example_permute)

# add_example_executable is a project-provided helper (not defined in this file);
# presumably it creates an executable target with the given name from the listed source.
add_example_executable(example_permute_1xHxW_fp32 permute_1xHxW_fp32.cpp)
add_example_executable(example_permute_NxHxW_fp32 permute_NxHxW_fp32.cpp)

# Attach each example to the umbrella target.
add_dependencies(example_permute example_permute_1xHxW_fp32)
add_dependencies(example_permute example_permute_NxHxW_fp32)
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2022, Advanced Micro Devices, Inc. All rights reserved.
#include "common.hpp"
// Element types handed to DevicePermute as its first two template arguments
// (the "InData Type" and "OutData Type" columns of the table below).
// F32 is not declared in this file — presumably it comes from common.hpp.
using ADataType = F32;
using BDataType = F32;
// Concrete DevicePermute instantiation used by this example.
// The "######" header rows label the template arguments column by column; read
// each column top to bottom (e.g. "HPer" + "Block", "Src" + "ScalarPerVector").
// NumDim is 3 here, and main() passes three-element lists to run_permute_example.
// PassThrough and S<...> are not declared in this file — presumably also from common.hpp.
// clang-format off
using DevicePermuteInstance = ck::tensor_operation::device::DevicePermute
// ######| InData| OutData| Elementwise| NumDim| Block| HPer| WPer| InBlock| InBlockTransfer| InBlockTransfer| Src| Dst| Src| Dst|
// ######| Type| Type| Operation| | Size| Block| Block| LdsExtraW| ThreadClusterLengths| ThreadClusterArrangeOrder| VectorDim| VectorDim| ScalarPerVector| ScalarPerVector|
// ######| | | | | | | | | | | | | | |
// ######| | | | | | | | | | | | | | |
< ADataType, BDataType, PassThrough, 3, 256, 128, 128, 0, S<1, 16, 16>, S<0, 1, 2>, 2, 1, 1, 1>;
// clang-format on
#include "run_permute_example.inc"
// Program entry point for the NxHxW fp32 permute example.
//
// Forwards the command-line arguments to run_permute_example together with two
// fixed lists, {11, 768, 80} and {0, 2, 1}. Presumably these are the default
// tensor lengths and the axis permutation — confirm in run_permute_example.inc.
//
// The process exit status is the logical negation of the helper's result:
// 0 when the helper yields a true value, 1 otherwise.
int main(int argc, char* argv[])
{
    const bool example_failed = !run_permute_example(argc, argv, {11, 768, 80}, {0, 2, 1});

    return example_failed ? 1 : 0;
}
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment