#include "op_plugin/AclOpsInterface.h"
#include "op_plugin/OpApiInterface.h"
#include "op_plugin/utils/op_api_common.h"
namespace op_api {
at::Tensor& mse_loss_out(
const at::Tensor& self,
const at::Tensor& target,
int64_t reduction,
at::Tensor& result) {
DO_COMPATIBILITY(aclnnMseLoss, acl_op::mse_loss_out(self, target, reduction, result));
at::IntArrayRef output_size;
if (reduction == at::Reduction::None) {
output_size = op_infer::broadcast_ops_npu_output_size(self, target);
}
at_npu::native::OpPreparation::check_tensor({self, target}, result, result.scalar_type(), output_size);
EXEC_NPU_CMD(aclnnMseLoss, self, target, reduction, result);
return result;
}
at::Tensor mse_loss(
const at::Tensor& self,
const at::Tensor& target,
int64_t reduction) {
DO_COMPATIBILITY(aclnnMseLoss, acl_op::mse_loss(self, target, reduction));
c10::SmallVector<int64_t, op_infer::SIZE> output_size;
if (reduction == at::Reduction::None) {
output_size = op_infer::broadcast_ops_npu_output_size(self, target);
}
at::ScalarType high_type = at::native::result_type(self, target);
at::Tensor result =
at_npu::native::OpPreparation::apply_tensor_without_format(output_size, self.options().dtype(high_type));
EXEC_NPU_CMD(aclnnMseLoss, self, target, reduction, result);
return result;
}
}