#include #include at::Tensor ROIAlign_Forward_CPU( const at::Tensor& input, const at::Tensor& bottom_rois, int64_t pooled_height, int64_t pooled_width, double spatial_scale, int64_t sampling_ratio); at::Tensor ROIAlign_Backward_CPU( const at::Tensor& bottom_rois, const at::Tensor& grad_output, int64_t b_size, int64_t channels, int64_t height, int64_t width, int64_t pooled_height, int64_t pooled_width, double spatial_scale, int64_t sampling_ratio); at::Tensor Aggregate_Forward_CPU( const at::Tensor A, const at::Tensor X, const at::Tensor C); std::vector Aggregate_Backward_CPU( const at::Tensor GE, const at::Tensor A, const at::Tensor X, const at::Tensor C); at::Tensor ScaledL2_Forward_CPU( const at::Tensor X_, const at::Tensor C_, const at::Tensor S_); std::vector ScaledL2_Backward_CPU( const at::Tensor GSL_, const at::Tensor X_, const at::Tensor C_, const at::Tensor S_, const at::Tensor SL_); at::Tensor BatchNorm_Forward_CPU( const at::Tensor input_, const at::Tensor mean_, const at::Tensor std_, const at::Tensor gamma_, const at::Tensor beta_); std::vector BatchNorm_Backward_CPU( const at::Tensor gradoutput_, const at::Tensor input_, const at::Tensor mean_, const at::Tensor std_, const at::Tensor gamma_, const at::Tensor beta_, bool train); std::vector Sum_Square_Forward_CPU( const at::Tensor input_); at::Tensor Sum_Square_Backward_CPU( const at::Tensor input_, const at::Tensor gradSum_, const at::Tensor gradSquare_); std::vector Non_Max_Suppression_CPU( const at::Tensor& input, const at::Tensor& scores, double thresh);