#pragma once #include at::Tensor nms_3d_cpu(const at::Tensor& dets, const at::Tensor& scores, const float threshold);