* Copyright (c) 2025 Huawei Technologies Co., Ltd.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#include "broadcast_auto_selector.h"
#include "selector_registry.h"
#include "hccl_aiv_utils.h"
namespace ops_hccl {
constexpr u32 TOPO_LEVEL_NUM_3 = 3;
SelectorStatus BroadcastAutoSelector::SelectCcuMsAlgo(const TopoInfoWithNetLayerDetails* topoInfo, const OpParam &opParam,
const std::map<HcclCMDType, std::vector<HcclAlgoType>> &configAlgMap,
std::string &selectAlgName) const
{
(void)configAlgMap;
HCCL_DEBUG("[BroadcastAutoSelector][%s] start, topoInfo levelNum[%u]", __func__, topoInfo->topoLevelNums);
if (topoInfo->topoLevelNums > 1) {
HCCL_WARNING("[Algo][BroadcastAutoSelector] levelNum > 1 is not supported yet for ccu_ms mode.");
return SelectorStatus::NOT_MATCH;
} else {
return SelectMeshAlgoCcuMs(topoInfo, opParam, selectAlgName);
}
}
SelectorStatus BroadcastAutoSelector::SelectMeshAlgoCcuMs(const TopoInfoWithNetLayerDetails* topoInfo, const OpParam &opParam,
std::string &selectAlgName) const
{
(void)opParam;
if (topoInfo->level0Topo == Level0Shape::MESH_1D) {
if (topoInfo->is2DieFullMesh) {
HCCL_WARNING("[BroadcastAutoSelector] 2DieFullMesh is not supported yet for schedule mode.");
return SelectorStatus::NOT_MATCH;
} else {
selectAlgName = "CcuBroadcastMesh1D";
}
} else if (topoInfo->level0Topo == Level0Shape::MESH_1D_CLOS) {
if (IsLayerAllConnetedWithTopo(topoInfo, 0, CommTopo::COMM_TOPO_1DMESH)) {
selectAlgName = "CcuBroadcastMesh1D";
} else {
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu_ms mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
}
} else if (topoInfo->level0Topo == Level0Shape::CLOS){
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu_ms mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
} else {
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu_ms mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
}
HCCL_INFO("[BroadcastAutoSelector][%s] Algo match [%s]", __func__, selectAlgName.c_str());
return SelectorStatus::MATCH;
}
SelectorStatus BroadcastAutoSelector::SelectCcuScheduleAlgo(const TopoInfoWithNetLayerDetails* topoInfo,
const OpParam &opParam,
const std::map<HcclCMDType, std::vector<HcclAlgoType>> &configAlgMap,
std::string &selectAlgName) const
{
(void)opParam;
(void)configAlgMap;
HCCL_DEBUG("[BroadcastAutoSelector][%s] start, topoInfo levelNum[%u]", __func__, topoInfo->topoLevelNums);
if (topoInfo->topoLevelNums > 1) {
if (topoInfo->level0Topo == Level0Shape::MESH_1D) {
if(topoInfo->netLayerDetails.localNetInsSizeOfLayer[0] == 1){
selectAlgName = "CcuBroadcastNHR1DMem2Mem";
} else if (topoInfo->is2DieFullMesh) {
HCCL_WARNING("[BroadcastAutoSelector] 2DieFullMesh is not supported yet for ccu schedule mode.");
return SelectorStatus::NOT_MATCH;
} else {
selectAlgName = "CcuBroadcastParallelMesh1DNHR";
}
} else {
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu schedule mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
}
} else {
if (topoInfo->level0Topo == Level0Shape::MESH_1D) {
if (topoInfo->is2DieFullMesh) {
HCCL_WARNING("[BroadcastAutoSelector] 2DieFullMesh is not supported yet for ccu schedule mode.");
return SelectorStatus::NOT_MATCH;
} else {
selectAlgName = "CcuBroadcastMesh1DMem2Mem";
}
} else if (topoInfo->level0Topo == Level0Shape::MESH_1D_CLOS) {
if (IsLayerAllConnetedWithTopo(topoInfo, 0, CommTopo::COMM_TOPO_1DMESH)) {
selectAlgName = "CcuBroadcastMesh1DMem2Mem";
} else if (topoInfo->level0PcieMix) {
HCCL_WARNING("[BroadcastAutoSelector] pcie mixed topo is not supported yet for ccu schedule mode.");
return SelectorStatus::NOT_MATCH;
} else {
selectAlgName = "CcuBroadcastParallelMesh1DNHRUBX";
}
} else if (topoInfo->level0Topo == Level0Shape::CLOS) {
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu schedule mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
} else {
HCCL_WARNING("[Algo][BroadcastAutoSelector] level0Shape[%d] is not supported yet for ccu schedule mode.",
topoInfo->level0Topo);
return SelectorStatus::NOT_MATCH;
}
}
HCCL_INFO("[BroadcastAutoSelector][%s] Algo match [%s]", __func__, selectAlgName.c_str());
return SelectorStatus::MATCH;
}
SelectorStatus BroadcastAutoSelector::SelectAicpuAlgo(const TopoInfoWithNetLayerDetails* topoInfo,
const OpParam &opParam,
const std::map<HcclCMDType, std::vector<HcclAlgoType>> &configAlgMap,
std::string &selectAlgName) const
{
(void)configAlgMap;
HCCL_DEBUG("[BroadcastAutoSelector][%s] start, topoInfo levelNum[%u]", __func__, topoInfo->topoLevelNums);
if (topoInfo->topoLevelNums > 1) {
if (topoInfo->topoLevelNums == TOPO_LEVEL_NUM_3) {
if (topoInfo->netLayerDetails.localNetInsSizeOfLayer[1] == 1) {
selectAlgName = "InsBroadcastNHR";
} else {
selectAlgName = "InsBroadcastParallelNHRNHRUboe";
}
} else if (topoInfo->netLayerDetails.localNetInsSizeOfLayer[0] == 1) {
selectAlgName = "InsBroadcastNHR";
} else if (topoInfo->level0Topo == Level0Shape::MESH_1D) {
selectAlgName = "InsBroadcastParallelMesh1DNHR";
} else if (topoInfo->level0Topo == Level0Shape::CLOS) {
selectAlgName = "InsBroadcastNHR";
} else {
HCCL_WARNING("[BroadcastAutoSelector] topo not match");
return SelectorStatus::NOT_MATCH;
}
} else {
return SelectMeshAlgoAicpu(topoInfo, opParam, selectAlgName);
}
HCCL_INFO("[BroadcastAutoSelector][%s] Algo match [%s]", __func__, selectAlgName.c_str());
return SelectorStatus::MATCH;
}
SelectorStatus BroadcastAutoSelector::SelectMeshAlgoAicpu(const TopoInfoWithNetLayerDetails* topoInfo, const OpParam &opParam,
std::string &selectAlgName) const
{
if (topoInfo->level0Topo == Level0Shape::MESH_1D) {
selectAlgName = "InsBroadcastMesh1DTwoShot";
} else if (topoInfo->level0Topo == Level0Shape::MESH_1D_CLOS) {
if (IsLayerAllConnetedWithTopo(topoInfo, 0, CommTopo::COMM_TOPO_1DMESH)) {
selectAlgName = "InsBroadcastMesh1DTwoShot";
} else if (topoInfo->level0PcieMix) {
selectAlgName = "InsBroadcastParallelMesh1DNHRPcie";
} else {
selectAlgName = "InsBroadcastParallelMesh1DNHRUBX";
}
} else if (topoInfo->level0Topo == Level0Shape::CLOS) {
selectAlgName = "InsBroadcastNHR";
} else {
HCCL_WARNING("[BroadcastAutoSelector] topo not match");
return SelectorStatus::NOT_MATCH;
}
HCCL_INFO("[BroadcastAutoSelector][%s] Algo match [%s]", __func__, selectAlgName.c_str());
return SelectorStatus::MATCH;
}
SelectorStatus BroadcastAutoSelector::SelectAivAlgo(const TopoInfoWithNetLayerDetails* topoInfo, const OpParam &opParam,
const std::map<HcclCMDType, std::vector<HcclAlgoType>> &configAlgMap,
std::string &selectAlgName) const
{
(void)opParam;
(void)configAlgMap;
std::vector<HcclAlgoType> algos = std::vector<HcclAlgoType>(HCCL_ALGO_LEVEL_NUM, HcclAlgoType::HCCL_ALGO_TYPE_DEFAULT);
if (topoInfo->userRankSize > MAX_RANK_SIZE_V) {
HCCL_DEBUG("[BroadcastAutoSelector][%s] rankSize[%u] larger than [%u]", __func__, topoInfo->userRankSize, MAX_RANK_SIZE);
return SelectorStatus::NOT_MATCH;
}
void *cclBufferAddr;
uint64_t cclBufferSize;
CHK_PRT_RET(HcclGetHcclBuffer(opParam.hcclComm, &cclBufferAddr, &cclBufferSize) != HCCL_SUCCESS,
HCCL_WARNING("[BroadcastAutoSelector] HcclGetHcclBuffer failed."), SelectorStatus::NOT_MATCH);
u64 perDataSize = DATATYPE_SIZE_TABLE[opParam.DataDes.dataType];
u64 dataSize = opParam.DataDes.count * perDataSize;
if (dataSize > cclBufferSize * AIV_MAX_CCL_LOOP_NUM) {
HCCL_DEBUG("[BroadcastAutoSelector][%s] dataSize[%llu] too large for cclBufferSize [%llu]", __func__, dataSize, cclBufferSize);
return SelectorStatus::NOT_MATCH;
}
selectAlgName = "AivBroadcastMesh1D";
HCCL_INFO("[BroadcastAutoSelector][%s] Algo match [%s]", __func__, selectAlgName.c_str());
return SelectorStatus::MATCH;
}
SelectorStatus BroadcastAutoSelector::SelectDPUAlgo(const TopoInfoWithNetLayerDetails *topoInfo, const OpParam &opParam,
const std::map<HcclCMDType, std::vector<HcclAlgoType>> &configAlgMap,
std::string &selectAlgName) const
{
std::vector<HcclAlgoType> algos =
std::vector<HcclAlgoType>(HCCL_ALGO_LEVEL_NUM, HcclAlgoType::HCCL_ALGO_TYPE_DEFAULT);
auto it = configAlgMap.find(opParam.opType);
if ((it != configAlgMap.end()) && (it->second.size() > 1)) {
algos = it->second;
}
HCCL_INFO("hccl algo op config: config opType:%d, level0:%u, level1:%u, level2:%u, level3:%u", opParam.opType,
algos[0], algos[1], algos[2], algos[3]);
if (topoInfo->topoLevelNums > 1) {
if ((topoInfo->deviceNumPerModule == 1) || (topoInfo->level0Topo == Level0Shape::MESH_1D)) {
selectAlgName = "InsBroadcastSequenceMeshNhrDPU";
return SelectorStatus::MATCH;
}
}
return SelectorStatus::NOT_MATCH;
}
REGISTER_SELECTOR_BY_OPTYPE(HcclCMDType::HCCL_CMD_BROADCAST, 18, BroadcastAutoSelector);
}