#include "op_plugin/AclOpsInterface.h"
#include "op_plugin/utils/OpAdapter.h"
namespace acl_op {
using npu_preparation = at_npu::native::OpPreparation;
#if VERSION_BETWEEN(V1R11, V2R7)
at::Tensor hardswish_backward(const at::Tensor& grad_output, const at::Tensor& self)
{
at::Tensor grad_input = npu_preparation::apply_tensor(grad_output);
at_npu::native::OpCommand cmd;
cmd.Name("HardSwishGrad")
.Input(grad_output)
.Input(self)
.Output(grad_input)
.Run();
return grad_input;
}
#endif
#if VERSION_BETWEEN(V2R8, VERSION_NEWEST)
at::Tensor hardswish_backward(const at::Tensor& grad_output, const at::Tensor& self)
{
at::Tensor grad_input = npu_preparation::apply_tensor(grad_output);
at_npu::native::OpCommand cmd;
cmd.Name("HardSwishGrad")
.Input(grad_output)
.Input(self)
.Output(grad_input)
.Run();
at::Tensor values_le3 = at::empty({}, self.options());
at::Tensor values_ge3 = at::empty({}, self.options());
acl_op::fill_(values_le3, 0.0f);
acl_op::fill_(values_ge3, 1.0f);
grad_input.index_put_({self.eq(-3.0f)}, values_le3);
grad_input.index_put_({self.eq(3.0f)}, values_ge3);
return grad_input;
}
#endif
}