// Copyright 2019 Yan Yan // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include #include namespace spconv { namespace functor { template struct SparseGatherFunctor { void operator()(const tv::CPU& d, tv::TensorView buffer, tv::TensorView features, tv::TensorView indices, int size) { int numPlanes = features.dim(1); for (int i = 0; i < size; ++i) { std::memcpy(buffer.data() + i * numPlanes, features.data() + indices[i] * numPlanes, sizeof(T) * numPlanes); } } }; template struct SparseScatterAddFunctor { void operator()(const tv::CPU& d, tv::TensorView outFeatures, tv::TensorView buffer, tv::TensorView indices, int size, bool stable) { int numPlanes = outFeatures.dim(1); const T* buf = buffer.data(); T* out = outFeatures.data(); for (int i = 0; i < size; ++i) { buf = buffer.data() + i * numPlanes; out = outFeatures.data() + indices[i] * numPlanes; for (int j = 0; j < numPlanes; ++j) { out[j] += buf[j]; } } } }; } // namespace functor #define DECLARE_CPU_SPECS_T_INDEX(T, Index) \ template struct functor::SparseGatherFunctor; \ template struct functor::SparseScatterAddFunctor; #define DECLARE_CPU_SPECS(T) \ DECLARE_CPU_SPECS_T_INDEX(T, int); \ DECLARE_CPU_SPECS_T_INDEX(T, long); DECLARE_CPU_SPECS(float); DECLARE_CPU_SPECS(double); DECLARE_CPU_SPECS(at::Half); #undef DECLARE_CPU_SPECS #undef DECLARE_CPU_SPECS_T_INDEX } // namespace spconv