* Copyright (c) 2025 Huawei Technologies Co., Ltd.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#include <cmath>
#include <random>
#include "gtest/gtest.h"
#include "tikicpulib.h"
#include "test_api_utils.h"
#include "bitwise_and.h"
using namespace AscendC;
template <typename T>
struct TensorBitwiseAndInputParam {
T *y{};
T *exp{};
T *src0{};
T *src1{};
uint32_t size{0};
uint32_t out_size{0};
};
class TestApiBitwiseAnd : public testing::Test {
protected:
template <typename T>
static void InvokeKernelWithTwoTensorInput(TensorBitwiseAndInputParam<T> ¶m) {
TPipe tpipe;
TBuf<TPosition::VECCALC> x1buf, x2buf, ybuf, tmp;
tpipe.InitBuffer(x1buf, sizeof(T) * param.size);
tpipe.InitBuffer(x2buf, sizeof(T) * param.size);
tpipe.InitBuffer(ybuf, sizeof(T) * AlignUp(param.size, ONE_BLK_SIZE / sizeof(T)));
tpipe.InitBuffer(tmp, 32);
LocalTensor<T> l_x1 = x1buf.Get<T>();
LocalTensor<T> l_x2 = x2buf.Get<T>();
LocalTensor<T> l_y = ybuf.Get<T>();
LocalTensor<uint8_t> l_tmp = tmp.Get<uint8_t>();
GmToUb(l_x1, param.src0, param.size);
GmToUb(l_x2, param.src1, param.size);
BitwiseAndExtend(l_y, l_x1, l_x2, l_tmp, param.size);
UbToGm(param.y, l_y, param.size);
}
template <typename T>
static void CreateTensorInput(TensorBitwiseAndInputParam<T> ¶m) {
param.y = static_cast<T *>(AscendC::GmAlloc(sizeof(T) * param.size));
param.exp = static_cast<T *>(AscendC::GmAlloc(sizeof(T) * param.size));
param.src0 = static_cast<T *>(AscendC::GmAlloc(sizeof(T) * param.size));
param.src1 = static_cast<T *>(AscendC::GmAlloc(sizeof(T) * param.size));
int input_range = 1;
std::mt19937 eng(1);
std::uniform_int_distribution distr(0, input_range);
std::mt19937 eng1(3);
std::uniform_int_distribution distr1(0, input_range);
for (int i = 0; i < param.size; i++) {
T input = distr(eng);
T input1 = distr1(eng1);
if (std::is_same_v<T, uint8_t>) {
input = input != 0;
input1 = input1 != 0;
}
param.src0[i] = input;
param.src1[i] = input1;
param.exp[i] = input & input1;
}
}
template <typename T>
static uint32_t Valid(T *y, T *exp, size_t comp_size) {
uint32_t diff_count = 0;
for (uint32_t i = 0; i < comp_size; i++) {
if (y[i] != exp[i]) {
diff_count++;
}
}
return diff_count;
}
template <typename T>
static void BitwiseAndTest(uint32_t size) {
TensorBitwiseAndInputParam<T> param{};
param.size = size;
CreateTensorInput(param);
auto kernel = [¶m] { InvokeKernelWithTwoTensorInput(param); };
AscendC::SetKernelMode(KernelMode::AIV_MODE);
ICPU_RUN_KF(kernel, 1);
uint32_t diff_count = Valid(param.y, param.exp, param.size);
EXPECT_EQ(diff_count, 0);
AscendC::GmFree(param.y);
AscendC::GmFree(param.exp);
AscendC::GmFree(param.src0);
AscendC::GmFree(param.src1);
}
};
TEST_F(TestApiBitwiseAnd, BitwiseAnd_Test) {
BitwiseAndTest<int16_t>(ONE_BLK_SIZE / sizeof(int16_t));
BitwiseAndTest<int16_t>(ONE_REPEAT_BYTE_SIZE / sizeof(int16_t));
BitwiseAndTest<int16_t>(MAX_REPEAT_NUM *ONE_REPEAT_BYTE_SIZE / sizeof(int16_t));
BitwiseAndTest<int16_t>((ONE_BLK_SIZE - sizeof(int16_t)) / sizeof(int16_t));
BitwiseAndTest<int16_t>((ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) / sizeof(int16_t));
BitwiseAndTest<int16_t>((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE / sizeof(int16_t));
BitwiseAndTest<int16_t>(((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE + (ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) + (ONE_BLK_SIZE - sizeof(int16_t))) /sizeof(int16_t));
BitwiseAndTest<int64_t>(ONE_BLK_SIZE / sizeof(int64_t));
BitwiseAndTest<int64_t>(ONE_REPEAT_BYTE_SIZE / sizeof(int64_t));
BitwiseAndTest<int64_t>(MAX_REPEAT_NUM *ONE_REPEAT_BYTE_SIZE / sizeof(int64_t));
BitwiseAndTest<int64_t>((ONE_BLK_SIZE - sizeof(int64_t)) / sizeof(int64_t));
BitwiseAndTest<int64_t>((ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) / sizeof(int64_t));
BitwiseAndTest<int64_t>((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE / sizeof(int64_t));
BitwiseAndTest<int64_t>(((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE + (ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) + (ONE_BLK_SIZE - sizeof(int64_t))) /sizeof(int64_t));
BitwiseAndTest<uint8_t>(ONE_BLK_SIZE / sizeof(uint8_t));
BitwiseAndTest<uint8_t>(ONE_REPEAT_BYTE_SIZE / sizeof(uint8_t));
BitwiseAndTest<uint8_t>(MAX_REPEAT_NUM *ONE_REPEAT_BYTE_SIZE / sizeof(uint8_t));
BitwiseAndTest<uint8_t>((ONE_BLK_SIZE - sizeof(uint8_t)) / sizeof(uint8_t));
BitwiseAndTest<uint8_t>((ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) / sizeof(uint8_t));
BitwiseAndTest<uint8_t>((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE / sizeof(uint8_t));
BitwiseAndTest<uint8_t>(((MAX_REPEAT_NUM - 1) * ONE_REPEAT_BYTE_SIZE + (ONE_REPEAT_BYTE_SIZE - ONE_BLK_SIZE) + (ONE_BLK_SIZE - sizeof(uint8_t))) /sizeof(uint8_t));
}