group_points.cpp 2.37 KB
Newer Older
zhangwenwei's avatar
zhangwenwei committed
1
#include <THC/THC.h>
wuyuefeng's avatar
wuyuefeng committed
2
3
4
#include <cuda.h>
#include <cuda_runtime_api.h>
#include <torch/extension.h>
zhangwenwei's avatar
zhangwenwei committed
5
6
7
#include <torch/serialize/tensor.h>

#include <vector>
wuyuefeng's avatar
wuyuefeng committed
8
9
10
11

// THC state object, declared extern here (no definition appears in this file
// as shown). The wrappers below pass it to THCState_getCurrentStream to obtain
// the CUDA stream handed to the kernel launchers.
extern THCState *state;

int group_points_wrapper(int b, int c, int n, int npoints, int nsample,
zhangwenwei's avatar
zhangwenwei committed
12
13
                         at::Tensor points_tensor, at::Tensor idx_tensor,
                         at::Tensor out_tensor);
wuyuefeng's avatar
wuyuefeng committed
14
15

void group_points_kernel_launcher(int b, int c, int n, int npoints, int nsample,
zhangwenwei's avatar
zhangwenwei committed
16
17
                                  const float *points, const int *idx,
                                  float *out, cudaStream_t stream);
wuyuefeng's avatar
wuyuefeng committed
18
19

int group_points_grad_wrapper(int b, int c, int n, int npoints, int nsample,
zhangwenwei's avatar
zhangwenwei committed
20
21
                              at::Tensor grad_out_tensor, at::Tensor idx_tensor,
                              at::Tensor grad_points_tensor);
wuyuefeng's avatar
wuyuefeng committed
22

zhangwenwei's avatar
zhangwenwei committed
23
24
25
26
// Launcher for the backward grouping kernel. Only declared here; the
// definition is not in this file as shown (presumably in the accompanying CUDA
// source -- confirm). `grad_out` and `idx` are read-only inputs, `grad_points`
// is the mutable output buffer, and `stream` is the CUDA stream supplied by
// the caller.
void group_points_grad_kernel_launcher(
    int b, int c, int n, int npoints, int nsample,
    const float *grad_out,
    const int *idx,
    float *grad_points,
    cudaStream_t stream);
wuyuefeng's avatar
wuyuefeng committed
27
28

int group_points_grad_wrapper(int b, int c, int n, int npoints, int nsample,
zhangwenwei's avatar
zhangwenwei committed
29
30
31
32
33
                              at::Tensor grad_out_tensor, at::Tensor idx_tensor,
                              at::Tensor grad_points_tensor) {
  float *grad_points = grad_points_tensor.data_ptr<float>();
  const int *idx = idx_tensor.data_ptr<int>();
  const float *grad_out = grad_out_tensor.data_ptr<float>();
wuyuefeng's avatar
wuyuefeng committed
34

zhangwenwei's avatar
zhangwenwei committed
35
  cudaStream_t stream = THCState_getCurrentStream(state);
wuyuefeng's avatar
wuyuefeng committed
36

zhangwenwei's avatar
zhangwenwei committed
37
38
39
  group_points_grad_kernel_launcher(b, c, n, npoints, nsample, grad_out, idx,
                                    grad_points, stream);
  return 1;
wuyuefeng's avatar
wuyuefeng committed
40
41
42
}

int group_points_wrapper(int b, int c, int n, int npoints, int nsample,
zhangwenwei's avatar
zhangwenwei committed
43
44
45
46
47
                         at::Tensor points_tensor, at::Tensor idx_tensor,
                         at::Tensor out_tensor) {
  const float *points = points_tensor.data_ptr<float>();
  const int *idx = idx_tensor.data_ptr<int>();
  float *out = out_tensor.data_ptr<float>();
wuyuefeng's avatar
wuyuefeng committed
48

zhangwenwei's avatar
zhangwenwei committed
49
  cudaStream_t stream = THCState_getCurrentStream(state);
wuyuefeng's avatar
wuyuefeng committed
50

zhangwenwei's avatar
zhangwenwei committed
51
52
53
  group_points_kernel_launcher(b, c, n, npoints, nsample, points, idx, out,
                               stream);
  return 1;
wuyuefeng's avatar
wuyuefeng committed
54
55
56
}

// Python bindings for the extension module:
//   "forward"  -> group_points_wrapper
//   "backward" -> group_points_grad_wrapper
// The third argument of each m.def call is the function's docstring.
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  m.def("forward",
        &group_points_wrapper,
        "group_points_wrapper");
  m.def("backward",
        &group_points_grad_wrapper,
        "group_points_grad_wrapper");
}