#include "csrc/OpApiCommon.h"
#include "csrc/functions.h"
/**
 * @brief Validates the inputs, allocates the index output and launches the
 *        aclnnDiffIouRotatedSortVertices NPU command.
 *
 * @param vertices  4D tensor; its first two dimensions (B, N) size the output.
 * @param mask      3D tensor whose first two dimensions must equal (B, N). It is
 *                  converted to float before being handed to the kernel.
 * @param num_valid 2D tensor whose dimensions must equal (B, N). Its tensor
 *                  options are reused for the output tensor.
 * @return A newly allocated tensor of shape (B, N, 9) that is passed to the
 *         kernel as its last argument (presumably the kernel's output buffer).
 *
 * Fails via TORCH_CHECK when a rank is wrong or when the leading (B, N)
 * dimensions of the three inputs disagree.
 */
at::Tensor diff_iou_rotated_sort_vertices(const at::Tensor& vertices, const at::Tensor& mask,
    const at::Tensor& num_valid)
{
    // Project macro; presumably verifies that each tensor lives on an NPU device.
    TORCH_CHECK_NPU(vertices);
    TORCH_CHECK_NPU(mask);
    TORCH_CHECK_NPU(num_valid);
    TORCH_CHECK(vertices.dim() == 4, "vertices must be a 4D Tensor, but got: ", vertices.dim());
    TORCH_CHECK(mask.dim() == 3, "mask must be a 3D Tensor, but got: ", mask.dim());
    TORCH_CHECK(num_valid.dim() == 2, "num_valid must be a 2D Tensor, but got: ", num_valid.dim());

    // Tensor sizes are int64_t; keep them at full width instead of truncating to 32 bits.
    const int64_t B = vertices.size(0);
    const int64_t N = vertices.size(1);

    // The output is sized from vertices alone, so reject inputs whose leading
    // dimensions disagree before they reach the kernel.
    TORCH_CHECK(mask.size(0) == B && mask.size(1) == N,
        "mask must match the first two dimensions of vertices (", B, ", ", N, "), but got: (",
        mask.size(0), ", ", mask.size(1), ")");
    TORCH_CHECK(num_valid.size(0) == B && num_valid.size(1) == N,
        "num_valid must match the first two dimensions of vertices (", B, ", ", N, "), but got: (",
        num_valid.size(0), ", ", num_valid.size(1), ")");

    // Length of the last output dimension.
    // NOTE(review): presumably the per-box number of sorted vertex indices the kernel emits - confirm.
    constexpr int64_t kSortedIdxLen = 9;
    at::Tensor sortedIdx = at::empty({B, N, kSortedIdxLen}, num_valid.options());

    // The kernel is given the mask as a float tensor.
    at::Tensor mask_fp = mask.to(at::kFloat);
    EXEC_NPU_CMD(aclnnDiffIouRotatedSortVertices, vertices, mask_fp, num_valid, sortedIdx);
    return sortedIdx;
}