Commit 974d67f2 authored by Andriy Roshchenko
Browse files

Add missing constructor.

parent b206fb26
...@@ -334,7 +334,7 @@ struct ThreadwiseTensorSliceTransfer_v3r1 ...@@ -334,7 +334,7 @@ struct ThreadwiseTensorSliceTransfer_v3r1
const bool is_src_valid = src_oob_thread_scratch_tuple_(thread_scratch_id) const bool is_src_valid = src_oob_thread_scratch_tuple_(thread_scratch_id)
.template GetAsType<bool>(src_data_idx_seq); .template GetAsType<bool>(src_data_idx_seq);
auto op_r_v = is_src_valid ? op_r : vector_t(0); auto op_r_v = is_src_valid ? op_r : vector_t{0};
src_thread_scratch_tuple_(thread_scratch_id) src_thread_scratch_tuple_(thread_scratch_id)
.template SetAsType<vector_t>(src_data_idx_seq, op_r_v); .template SetAsType<vector_t>(src_data_idx_seq, op_r_v);
......
...@@ -406,12 +406,12 @@ struct non_native_vector_base<f8_ocp_t, 2> ...@@ -406,12 +406,12 @@ struct non_native_vector_base<f8_ocp_t, 2>
{ {
using data_t = f8_ocp_t::data_type; using data_t = f8_ocp_t::data_type;
using type = non_native_vector_base<f8_ocp_t, 2>; using type = non_native_vector_base<f8_ocp_t, 2>;
__host__ __device__ non_native_vector_base() = default;
using data_v = fp8_impl::fp8x2_storage_t; // type of storage vector using data_v = fp8_impl::fp8x2_storage_t; // type of storage vector
data_v d; // storage vector data_v d; // storage vector
__host__ __device__ non_native_vector_base() = default;
__host__ __device__ non_native_vector_base(data_t a) : d{a} {}
using float2_t = fp8_impl::float2_t; using float2_t = fp8_impl::float2_t;
#if CK_USE_OCP_FP8 #if CK_USE_OCP_FP8
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment