* Copyright (c) 2026 Huawei Technologies Co., Ltd.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#if !defined(ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS)
#warning \
"impl/tensor_api/arch/cube/l1_to_l0a/copy.h is an internal header file and must not be used directly. Functions or variables defined in this file maybe removed in the future. Please use "#include "tensor_api/tensor.h"" and use public functions or variables defined in interface headers files."
#define ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS
#define UNDEF_ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS_ASCENDC
#endif
* \file copy.h
* \brief
*/
#ifndef IMPL_TENSOR_API_ARCH_CUBE_L1_TO_L0A_COPY_H
#define IMPL_TENSOR_API_ARCH_CUBE_L1_TO_L0A_COPY_H
#include "impl/tensor_api/arch/cube/l1_to_l0a/routing.h"
namespace AscendC {
namespace Te {
constexpr CopyL12L0ATrait DEFAULT_COPY_L1_TO_L0A_TRAIT;
struct CopyL12L0ATraitDefault {
using TraitType = CopyL12L0ATrait;
static constexpr const TraitType value = DEFAULT_COPY_L1_TO_L0A_TRAIT;
};
using CopyL12L0AModeSet = TupleMap<
Std::tuple<Std::tuple<_1, _0>, CopyMode::NORMAL>,
Std::tuple<Std::tuple<_1, _1>, CopyMode::NORMAL>,
Std::tuple<Std::tuple<_0, _0>, CopyMode::TRANS>,
Std::tuple<Std::tuple<_0, _1>, CopyMode::TRANS_B8B4>>;
using CopyL12L0AModeCoordSet = TupleMap<
Std::tuple<Std::tuple<_1, _0>, CopyMode::NORMAL_COORD>,
Std::tuple<Std::tuple<_1, _1>, CopyMode::NORMAL_COORD>,
Std::tuple<Std::tuple<_0, _0>, CopyMode::TRANS_COORD>,
Std::tuple<Std::tuple<_0, _1>, CopyMode::TRANS_B8B4_COORD>>;
struct CopyL12L0A {
public:
template <typename Tp, const Tp& traits, typename... Args>
__aicore__ inline static void Copy(const Args& ...args)
{
if ASCEND_IS_AIC {
LoadData<traits, Args...>(args...);
}
}
private:
template<const CopyL12L0ATrait& trait = DEFAULT_COPY_L1_TO_L0A_TRAIT, typename T, typename U>
__aicore__ inline static void LoadData(const T& dst, const U& src)
{
using dstPos = GetMemLocation<T>;
using srcPos = GetMemLocation<U>;
using DstLayout = typename T::layoutType;
using SrcLayout = typename U::layoutType;
using DstPattern = GetLayoutPattern<DstLayout>;
using SrcPattern = GetLayoutPattern<SrcLayout>;
constexpr auto isB8B4Type = sizeof(typename T::elementType) == 1;
constexpr auto noTrans = Std::is_same_v<DstPattern, SrcPattern>;
using CopyL12L0AMode = typename CopyL12L0AModeSet::template Get<Std::tuple<Std::Int<noTrans>, Std::Int<isB8B4Type>>>;
static_assert(!Std::is_same_v<CopyL12L0AMode, Std::ignore_t>, "Unsupported CopyL12L0AMode.");
using Tensor2Tensor = typename CopyL12L0ATensor2Tensor<dstPos, srcPos, CURRENT_ARCH_VERSION, DstPattern, SrcPattern, CopyL12L0AMode>::type;
Tensor2Tensor::template Run<trait, T, U>(dst, src);
}
template<const CopyL12L0ATrait& trait = DEFAULT_COPY_L1_TO_L0A_TRAIT, typename T, typename U, class Coord>
__aicore__ inline static void LoadData(const T& dst, const U& src, const Coord& coord)
{
using dstPos = GetMemLocation<T>;
using srcPos = GetMemLocation<U>;
using DstLayout = typename T::layoutType;
using SrcLayout = typename U::layoutType;
using DstPattern = GetLayoutPattern<DstLayout>;
using SrcPattern = GetLayoutPattern<SrcLayout>;
constexpr auto isB8B4Type = sizeof(typename T::elementType) == 1;
constexpr auto noTrans = Std::is_same_v<DstPattern, SrcPattern>;
using CopyL12L0AMode = typename CopyL12L0AModeCoordSet::template Get<Std::tuple<Std::Int<noTrans>, Std::Int<isB8B4Type>>>;
static_assert(!Std::is_same_v<CopyL12L0AMode, Std::ignore_t>, "Unsupported CopyL12L0ACoordMode.");
using Tensor2Tensor = typename CopyL12L0ATensor2Tensor<dstPos, srcPos, CURRENT_ARCH_VERSION, DstPattern, SrcPattern, CopyL12L0AMode>::type;
Tensor2Tensor::template Run<trait, T, U, Coord>(dst, src, coord);
}
};
}
}
#endif
#if defined(UNDEF_ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS_ASCENDC)
#undef ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS
#undef UNDEF_ASCENDC_TENSOR_API_INCLUDE_COMPILER_INTERNAL_HEADERS_ASCENDC
#endif