[Feature] Support knn gpu op #360

Merged (2 commits) on Mar 17, 2021.
3 changes: 2 additions & 1 deletion mmdet3d/ops/__init__.py
@@ -9,6 +9,7 @@
 from .group_points import (GroupAll, QueryAndGroup, group_points,
                            grouping_operation)
 from .interpolate import three_interpolate, three_nn
+from .knn import knn
 from .norm import NaiveSyncBatchNorm1d, NaiveSyncBatchNorm2d
 from .pointnet_modules import (PointFPModule, PointSAModule, PointSAModuleMSG,
                                build_sa_module)
@@ -25,7 +26,7 @@
     'dynamic_scatter', 'DynamicScatter', 'sigmoid_focal_loss',
     'SigmoidFocalLoss', 'SparseBasicBlock', 'SparseBottleneck',
     'RoIAwarePool3d', 'points_in_boxes_gpu', 'points_in_boxes_cpu',
-    'make_sparse_convmodule', 'ball_query', 'furthest_point_sample',
+    'make_sparse_convmodule', 'ball_query', 'knn', 'furthest_point_sample',
     'furthest_point_sample_with_dist', 'three_interpolate', 'three_nn',
     'gather_points', 'grouping_operation', 'group_points', 'GroupAll',
     'QueryAndGroup', 'PointSAModule', 'PointSAModuleMSG', 'PointFPModule',
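With knn added to the imports and to __all__ above, the op is re-exported at the package root. A minimal import check, as a sketch assuming mmdet3d was built with its CUDA extensions:

# Sketch: verify the new export; assumes a CUDA build of mmdet3d.
from mmdet3d.ops import knn
from mmdet3d.ops.knn import knn as knn_direct

assert knn is knn_direct  # both paths resolve to the same op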
14 changes: 7 additions & 7 deletions mmdet3d/ops/gather_points/gather_points.py
@@ -12,28 +12,28 @@ class GatherPoints(Function):
 
     @staticmethod
     def forward(ctx, features: torch.Tensor,
-                indicies: torch.Tensor) -> torch.Tensor:
+                indices: torch.Tensor) -> torch.Tensor:
         """forward.
 
         Args:
             features (Tensor): (B, C, N) features to gather.
-            indicies (Tensor): (B, M) where M is the number of points.
+            indices (Tensor): (B, M) where M is the number of points.
 
         Returns:
             Tensor: (B, C, M) where M is the number of points.
         """
         assert features.is_contiguous()
-        assert indicies.is_contiguous()
+        assert indices.is_contiguous()
 
-        B, npoint = indicies.size()
+        B, npoint = indices.size()
         _, C, N = features.size()
         output = torch.cuda.FloatTensor(B, C, npoint)
 
         gather_points_ext.gather_points_wrapper(B, C, N, npoint, features,
-                                                indicies, output)
+                                                indices, output)
 
-        ctx.for_backwards = (indicies, C, N)
-        ctx.mark_non_differentiable(indicies)
+        ctx.for_backwards = (indices, C, N)
+        ctx.mark_non_differentiable(indices)
         return output
 
     @staticmethod
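The change above is a pure rename (indicies to indices) with no behavioral effect. For reference, a usage sketch of the op with hypothetical shapes; it assumes a CUDA device and int32 indices, since the wrapper dispatches to a CUDA kernel:

import torch

from mmdet3d.ops import gather_points

# Hypothetical shapes: B=2 batches, C=16 channels, N=128 source points, M=32.
features = torch.rand(2, 16, 128).cuda()               # (B, C, N)
indices = torch.randint(0, 128, (2, 32)).int().cuda()  # (B, M), int32
gathered = gather_points(features, indices)            # (B, C, M)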
3 changes: 3 additions & 0 deletions mmdet3d/ops/knn/__init__.py
@@ -0,0 +1,3 @@
+from .knn import knn
+
+__all__ = ['knn']
68 changes: 68 additions & 0 deletions mmdet3d/ops/knn/knn.py
@@ -0,0 +1,68 @@
+import torch
+from torch.autograd import Function
+
+from . import knn_ext
+
+
+class KNN(Function):
+    """KNN (CUDA).
+
[Inline review comment from @ZwwWayne (Collaborator), Mar 17, 2021: "Need to ref the original implementation if necessary."]
+    Find k-nearest points.
+    """
+
+    @staticmethod
+    def forward(ctx,
+                k: int,
+                xyz: torch.Tensor,
+                center_xyz: torch.Tensor,
+                transposed: bool = False) -> torch.Tensor:
+        """forward.
+
+        Args:
+            k (int): number of nearest neighbors.
+            xyz (Tensor): (B, N, 3) if transposed == False, else (B, 3, N).
+                xyz coordinates of the features.
+            center_xyz (Tensor): (B, npoint, 3) if transposed == False,
+                else (B, 3, npoint). centers of the knn query.
+            transposed (bool): whether the input tensors are transposed.
+                defaults to False.
+
+        Returns:
+            Tensor: (B, k, npoint) tensor with the indices of
+                the features that form k-nearest neighbours.
+        """
+        assert k > 0
+
+        B, npoint = center_xyz.shape[:2]
+        N = xyz.shape[1]
+
+        if not transposed:
+            xyz = xyz.transpose(2, 1).contiguous()
+            center_xyz = center_xyz.transpose(2, 1).contiguous()
+
+        assert center_xyz.is_contiguous()
+        assert xyz.is_contiguous()
+
+        center_xyz_device = center_xyz.get_device()
+        assert center_xyz_device == xyz.get_device(), \
+            'center_xyz and xyz should be put on the same device'
+        if torch.cuda.current_device() != center_xyz_device:
+            torch.cuda.set_device(center_xyz_device)
+
+        idx = center_xyz.new_zeros((B, k, npoint)).long()
+
+        for bi in range(B):
+            knn_ext.knn_wrapper(xyz[bi], N, center_xyz[bi], npoint, idx[bi], k)
+
+        ctx.mark_non_differentiable(idx)
+
+        idx -= 1
+
+        return idx
+
+    @staticmethod
+    def backward(ctx, a=None):
+        return None, None
+
+
+knn = KNN.apply
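A usage sketch of the wrapper, with shapes following the docstring; it assumes a CUDA device. The idx -= 1 above suggests the underlying kernel writes 1-based indices, which the wrapper shifts to the usual 0-based convention before returning:

import torch

from mmdet3d.ops import knn

xyz = torch.rand(2, 256, 3).cuda()        # (B, N, 3) source points
center_xyz = torch.rand(2, 64, 3).cuda()  # (B, npoint, 3) query centers
idx = knn(8, xyz, center_xyz)             # (B, 8, npoint), 0-based long indices

Because idx is marked non-differentiable, backward returns None gradients and the op does not propagate gradients to its inputs.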
62 changes: 62 additions & 0 deletions mmdet3d/ops/knn/src/knn.cpp
@@ -0,0 +1,62 @@
+// Modified from https://github.com/unlimblue/KNN_CUDA
+
+#include <vector>
+#include <torch/extension.h>
+#include <ATen/cuda/CUDAContext.h>
+
+#define CHECK_CONTIGUOUS(x) AT_ASSERTM(x.is_contiguous(), #x " must be contiguous")
+#define CHECK_TYPE(x, t) AT_ASSERTM(x.dtype() == t, #x " must be " #t)
+#define CHECK_CUDA(x) AT_ASSERTM(x.device().type() == at::Device::Type::CUDA, #x " must be on CUDA")
+#define CHECK_INPUT(x, t) CHECK_CONTIGUOUS(x); CHECK_TYPE(x, t); CHECK_CUDA(x)
+
+
+void knn_kernels_launcher(
+    const float* ref_dev,
+    int ref_nb,
+    const float* query_dev,
+    int query_nb,
+    int dim,
+    int k,
+    float* dist_dev,
+    long* ind_dev,
+    cudaStream_t stream
+);
+
+// std::vector<at::Tensor> knn_wrapper(
+void knn_wrapper(
+    at::Tensor & ref,
+    int ref_nb,
+    at::Tensor & query,
+    int query_nb,
+    at::Tensor & ind,
+    const int k
+) {
+
+    CHECK_INPUT(ref, at::kFloat);
+    CHECK_INPUT(query, at::kFloat);
+    const float * ref_dev = ref.data_ptr<float>();
+    const float * query_dev = query.data_ptr<float>();
+    int dim = query.size(0);
+    auto dist = at::empty({ref_nb, query_nb}, query.options().dtype(at::kFloat));
+    float * dist_dev = dist.data_ptr<float>();
+    long * ind_dev = ind.data_ptr<long>();
+
+    cudaStream_t stream = at::cuda::getCurrentCUDAStream();
+
+    knn_kernels_launcher(
+        ref_dev,
+        ref_nb,
+        query_dev,
+        query_nb,
+        dim,
+        k,
+        dist_dev,
+        ind_dev,
+        stream
+    );
+}
+
+
+PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
+    m.def("knn_wrapper", &knn_wrapper, "knn_wrapper");
+}
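To sanity-check the extension, a brute-force reference is straightforward on the PyTorch side. A sketch (not part of this PR) using torch.cdist and topk; note that ties may be ordered differently than in the CUDA kernel:

import torch

def knn_reference(k, xyz, center_xyz):
    """Brute-force k-NN: (B, N, 3) points and (B, npoint, 3) centers
    produce (B, k, npoint) indices into xyz, nearest first."""
    dist = torch.cdist(center_xyz, xyz)               # (B, npoint, N) pairwise L2
    idx = dist.topk(k, dim=2, largest=False).indices  # (B, npoint, k)
    return idx.transpose(1, 2).contiguous()           # match the op's layout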