// Source: op-plugin/op_plugin/ops/aclops/QuantizeTensorKernelNpu.cpp (code preview) - op-plugin: an operator plugin project based on Ascend Extension for PyTorch - AtomGit

// Commit 7322d5de, created on 2024-08-05 (commit history)
// Copyright (c) 2023 Huawei Technologies Co., Ltd
// All rights reserved.
//
// Licensed under the BSD 3-Clause License  (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// https://opensource.org/licenses/BSD-3-Clause
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "op_plugin/utils/OpAdapter.h"

#if VERSION_BETWEEN(V2R2, VERSION_NEWEST)
#include "op_plugin/AclOpsInterface.h"
#include <ATen/ops/quantize_per_tensor.h>

namespace acl_op {
// Forwards to at::native::q_scale_quant and returns the scale it reports
// for `self`.
// NOTE(review): presumably `self` must be a per-tensor quantized tensor;
// any validation happens inside the native implementation, not here.
double q_scale(const at::Tensor& self)
{
    const double scale = at::native::q_scale_quant(self);
    return scale;
}

// Forwards to at::native::q_per_channel_scales and returns the tensor it
// produces for `self`, unchanged (no device or dtype conversion is applied
// in this wrapper).
at::Tensor q_per_channel_scales(const at::Tensor& self)
{
    at::Tensor scales = at::native::q_per_channel_scales(self);
    return scales;
}

// Forwards to at::native::q_zero_point_quant and returns the zero point it
// reports for `self`.
// NOTE(review): presumably `self` must be a per-tensor quantized tensor;
// any validation happens inside the native implementation, not here.
int64_t q_zero_point(const at::Tensor& self)
{
    const int64_t zero_point = at::native::q_zero_point_quant(self);
    return zero_point;
}

// Obtains the per-channel zero points of `self` from
// at::native::q_per_channel_zero_points, then converts the result with
// Tensor::to targeting the at::kPrivateUse1 device before returning it.
// NOTE(review): kPrivateUse1 is presumably the NPU backend here. The sibling
// wrapper q_per_channel_scales returns the native result without this
// device conversion; confirm the asymmetry is intentional.
at::Tensor q_per_channel_zero_points(const at::Tensor& self)
{
    return at::native::q_per_channel_zero_points(self).to(at::Device(at::kPrivateUse1));
}

// Forwards to at::native::q_per_channel_axis and returns the axis index it
// reports for `self`.
int64_t q_per_channel_axis(const at::Tensor& self)
{
    const int64_t axis = at::native::q_per_channel_axis(self);
    return axis;
}

// Forwards to at::native::qscheme_quant and returns the at::QScheme value it
// reports for `self`.
at::QScheme qscheme(const at::Tensor& self)
{
    const at::QScheme scheme = at::native::qscheme_quant(self);
    return scheme;
}

// Forwards to at::native::dequantize_quantized and returns the tensor it
// produces for `self`, unchanged.
// NOTE(review): presumably `self` is expected to be a quantized tensor;
// this wrapper performs no checks of its own.
at::Tensor dequantize(const at::Tensor& self)
{
    at::Tensor dequantized = at::native::dequantize_quantized(self);
    return dequantized;
}

// Creates a tensor by forwarding every argument, in the same order and
// unmodified, to at::native::empty_affine_quantized.
//
// Parameters (all passed straight through; their interpretation is defined
// by the native implementation):
//   size          - requested tensor sizes.
//   dtype         - optional scalar type.
//   layout        - optional layout.
//   device        - optional device.
//   pin_memory    - optional pinned-memory flag.
//   scale         - quantization scale.
//   zero_point    - quantization zero point.
//   memory_format - optional memory format.
//
// Returns the tensor produced by the native call.
at::Tensor _empty_affine_quantized(
    at::IntArrayRef size,
    c10::optional<at::ScalarType> dtype,
    c10::optional<at::Layout> layout,
    c10::optional<at::Device> device,
    c10::optional<bool> pin_memory,
    double scale,
    int64_t zero_point,
    c10::optional<c10::MemoryFormat> memory_format)
{
    at::Tensor output = at::native::empty_affine_quantized(
        size,
        dtype,
        layout,
        device,
        pin_memory,
        scale,
        zero_point,
        memory_format);
    return output;
}
} // namespace acl_op
#endif