#include "op_plugin/AclOpsInterface.h"
#include "op_plugin/utils/OpAdapter.h"
namespace acl_op {
using npu_preparation = at_npu::native::OpPreparation;
void cummin_out_npu_nocheck(at::Tensor &values, at::Tensor &indices, const at::Tensor &self, int64_t dim)
{
at_npu::native::OpCommand cmd;
cmd.Name("Cummin").Input(self).Output(values).Output(indices).Attr("axis", dim).Run();
}
void _cummin_helper(const at::Tensor &self, at::Tensor &values, at::Tensor &indices, int64_t dim)
{
if (self.scalar_type() == at::kLong) {
at::Tensor values_temp = npu_preparation::apply_tensor(self);
at::Tensor indices_temp = npu_preparation::apply_tensor(self, self.options().dtype(at::kLong));
cummin_out_npu_nocheck(values_temp, indices_temp, self, dim);
values.copy_(values_temp);
indices.copy_(indices_temp);
} else {
int64_t first_dim = op_plugin::utils::make_warp_dim(0, self.dim());
if (dim != first_dim) {
c10::SmallVector<int64_t, SIZE> perm;
for (int64_t i = 0; i < self.dim(); i++) {
perm.emplace_back(i);
}
std::swap(perm[dim], perm[first_dim]);
at::Tensor transpose_self = acl_op::npu_transpose(self, perm, true);
auto output_size = op_infer::transpose_npu_output_size(values, perm);
at::Tensor transpose_value = npu_preparation::apply_tensor(self, output_size);
at::Tensor transpose_indices =
npu_preparation::apply_tensor(output_size, self.options().dtype(at::kInt), self);
cummin_out_npu_nocheck(transpose_value, transpose_indices, transpose_self, first_dim);
transpose_indices = at_npu::native::custom_ops::_npu_dtype_cast(transpose_indices, at::kLong);
acl_op::npu_transpose_out(transpose_value, perm, true, values);
acl_op::npu_transpose_out(transpose_indices, perm, true, indices);
} else {
at::Tensor values_temp = npu_preparation::apply_tensor(self);
at::Tensor indices_temp = npu_preparation::apply_tensor(self, self.options().dtype(at::kInt));
cummin_out_npu_nocheck(values_temp, indices_temp, self, dim);
indices_temp = at_npu::native::custom_ops::_npu_dtype_cast(indices_temp, at::kLong);
values.copy_(values_temp);
indices.copy_(indices_temp);
}
}
}
}