nms.h 912 Bytes
Newer Older
1
#pragma once
Vasilis Vryniotis's avatar
Vasilis Vryniotis committed
2

3
#include "cpu/vision_cpu.h"
4
5

#ifdef WITH_CUDA
6
#include "autocast.h"
7
#include "cuda/vision_cuda.h"
8
#endif
9
#ifdef WITH_HIP
10
#include "autocast.h"
11
12
#include "hip/vision_cuda.h"
#endif
13

14
// nms dispatch nexus
15
16
17
at::Tensor nms(
    const at::Tensor& dets,
    const at::Tensor& scores,
Vasilis Vryniotis's avatar
Vasilis Vryniotis committed
18
    double iou_threshold) {
19
20
21
22
23
  static auto op = c10::Dispatcher::singleton()
                       .findSchemaOrThrow("torchvision::nms", "")
                       .typed<decltype(nms)>();
  return op.call(dets, scores, iou_threshold);
}
24

25
#if defined(WITH_CUDA) || defined(WITH_HIP)
26
27
28
at::Tensor nms_autocast(
    const at::Tensor& dets,
    const at::Tensor& scores,
Vasilis Vryniotis's avatar
Vasilis Vryniotis committed
29
    double iou_threshold) {
30
31
  c10::impl::ExcludeDispatchKeyGuard no_autocast(c10::DispatchKey::Autocast);
  return nms(
mcarilli's avatar
mcarilli committed
32
33
      at::autocast::cached_cast(at::kFloat, dets),
      at::autocast::cached_cast(at::kFloat, scores),
34
      iou_threshold);
35
}
36
#endif