"test/transforms_v2_kernel_infos.py" did not exist on "8b4bb5f13d72f6564d300e2749b3c563d8a2ff81"
vision.cpp 5.19 KB
Newer Older
1
2
3
4
5
6
#include <Python.h>
#include <torch/script.h>

#ifdef WITH_CUDA
#include <cuda.h>
#endif
7
8
9
#ifdef WITH_HIP
#include <hip/hip_runtime.h>
#endif
10

11
#include "DeformConv.h"
12
13
#include "PSROIAlign.h"
#include "PSROIPool.h"
14
15
#include "ROIAlign.h"
#include "ROIPool.h"
eellison's avatar
eellison committed
16
#include "empty_tensor_op.h"
17
18
#include "nms.h"

19
// If we are in a Windows environment, we need to define
20
// initialization functions for the _C extension
21
22
#ifdef _WIN32
#if PY_MAJOR_VERSION < 3
23
PyMODINIT_FUNC init_C(void) {
24
  // No need to do anything.
25
  // extension.py will run on load
26
27
28
  return NULL;
}
#else
29
PyMODINIT_FUNC PyInit__C(void) {
30
  // No need to do anything.
31
  // extension.py will run on load
32
33
34
  return NULL;
}
#endif
35
36
#endif

37
38
namespace vision {
int64_t cuda_version() noexcept {
39
#ifdef WITH_CUDA
40
41
42
  return CUDA_VERSION;
#else
  return -1;
43
#endif
44
}
45
} // namespace vision
46

47
TORCH_LIBRARY(torchvision, m) {
48
49
50
51
  m.def(
      "deform_conv2d(Tensor input, Tensor weight, Tensor offset, Tensor bias, int stride_h, int stride_w, int pad_h, int pad_w, int dilation_h, int dilation_w, int groups, int offset_groups) -> Tensor");
  m.def(
      "_deform_conv2d_backward(Tensor grad, Tensor input, Tensor weight, Tensor offset, Tensor bias, int stride_h, int stride_w, int pad_h, int pad_w, int dilation_h, int dilation_w, int groups, int offset_groups) -> (Tensor, Tensor, Tensor, Tensor)");
52
  m.def("nms(Tensor dets, Tensor scores, float iou_threshold) -> Tensor");
53
  m.def(
54
      "ps_roi_align(Tensor input, Tensor rois, float spatial_scale, int pooled_height, int pooled_width, int sampling_ratio) -> (Tensor, Tensor)");
55
  m.def(
56
      "_ps_roi_align_backward(Tensor grad, Tensor rois, Tensor channel_mapping, float spatial_scale, int pooled_height, int pooled_width, int sampling_ratio, int batch_size, int channels, int height, int width) -> Tensor");
57
  m.def(
58
      "ps_roi_pool(Tensor input, Tensor rois, float spatial_scale, int pooled_height, int pooled_width) -> (Tensor, Tensor)");
59
  m.def(
60
      "_ps_roi_pool_backward(Tensor grad, Tensor rois, Tensor channel_mapping, float spatial_scale, int pooled_height, int pooled_width, int batch_size, int channels, int height, int width) -> Tensor");
61
  m.def(
62
      "roi_align(Tensor input, Tensor rois, float spatial_scale, int pooled_height, int pooled_width, int sampling_ratio, bool aligned) -> Tensor");
63
  m.def(
64
      "_roi_align_backward(Tensor grad, Tensor rois, float spatial_scale, int pooled_height, int pooled_width, int batch_size, int channels, int height, int width, int sampling_ratio, bool aligned) -> Tensor");
65
  m.def(
66
      "roi_pool(Tensor input, Tensor rois, float spatial_scale, int pooled_height, int pooled_width) -> (Tensor, Tensor)");
67
  m.def(
68
      "_roi_pool_backward(Tensor grad, Tensor rois, Tensor argmax, float spatial_scale, int pooled_height, int pooled_width, int batch_size, int channels, int height, int width) -> Tensor");
69
  m.def("_cuda_version", &vision::cuda_version);
70
  m.def("_new_empty_tensor_op", &new_empty_tensor);
71
72
73
}

TORCH_LIBRARY_IMPL(torchvision, CPU, m) {
74
75
  m.impl("deform_conv2d", DeformConv2d_forward_cpu);
  m.impl("_deform_conv2d_backward", DeformConv2d_backward_cpu);
76
  m.impl("nms", nms_cpu);
77
78
  m.impl("ps_roi_align", PSROIAlign_forward_cpu);
  m.impl("_ps_roi_align_backward", PSROIAlign_backward_cpu);
79
80
81
82
83
84
  m.impl("ps_roi_pool", PSROIPool_forward_cpu);
  m.impl("_ps_roi_pool_backward", PSROIPool_backward_cpu);
  m.impl("roi_align", ROIAlign_forward_cpu);
  m.impl("_roi_align_backward", ROIAlign_backward_cpu);
  m.impl("roi_pool", ROIPool_forward_cpu);
  m.impl("_roi_pool_backward", ROIPool_backward_cpu);
85
86
87
88
89
}

// TODO: Place this in a hypothetical separate torchvision_cuda library
#if defined(WITH_CUDA) || defined(WITH_HIP)
TORCH_LIBRARY_IMPL(torchvision, CUDA, m) {
90
91
  m.impl("deform_conv2d", DeformConv2d_forward_cuda);
  m.impl("_deform_conv2d_backward", DeformConv2d_backward_cuda);
92
  m.impl("nms", nms_cuda);
93
94
  m.impl("ps_roi_align", PSROIAlign_forward_cuda);
  m.impl("_ps_roi_align_backward", PSROIAlign_backward_cuda);
95
96
97
98
99
100
  m.impl("ps_roi_pool", PSROIPool_forward_cuda);
  m.impl("_ps_roi_pool_backward", PSROIPool_backward_cuda);
  m.impl("roi_align", ROIAlign_forward_cuda);
  m.impl("_roi_align_backward", ROIAlign_backward_cuda);
  m.impl("roi_pool", ROIPool_forward_cuda);
  m.impl("_roi_pool_backward", ROIPool_backward_cuda);
101
102
103
104
}
#endif

// Autocast only needs to wrap forward pass ops.
105
#if defined(WITH_CUDA) || defined(WITH_HIP)
106
TORCH_LIBRARY_IMPL(torchvision, Autocast, m) {
107
  m.impl("deform_conv2d", DeformConv2d_autocast);
108
  m.impl("nms", nms_autocast);
109
  m.impl("ps_roi_align", PSROIAlign_autocast);
110
111
112
  m.impl("ps_roi_pool", PSROIPool_autocast);
  m.impl("roi_align", ROIAlign_autocast);
  m.impl("roi_pool", ROIPool_autocast);
113
114
115
116
}
#endif

TORCH_LIBRARY_IMPL(torchvision, Autograd, m) {
117
118
  m.impl("deform_conv2d", DeformConv2d_autograd);
  m.impl("_deform_conv2d_backward", DeformConv2d_backward_autograd);
119
120
  m.impl("ps_roi_align", PSROIAlign_autograd);
  m.impl("_ps_roi_align_backward", PSROIAlign_backward_autograd);
121
122
123
124
125
126
  m.impl("ps_roi_pool", PSROIPool_autograd);
  m.impl("_ps_roi_pool_backward", PSROIPool_backward_autograd);
  m.impl("roi_align", ROIAlign_autograd);
  m.impl("_roi_align_backward", ROIAlign_backward_autograd);
  m.impl("roi_pool", ROIPool_autograd);
  m.impl("_roi_pool_backward", ROIPool_backward_autograd);
127
}