* Copyright (c) 2025 Huawei Technologies Co., Ltd.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#ifndef COMMON_H
#define COMMON_H
#include "adapter_hccp_common.h"
#include "hccl_ip_address.h"
#include "hccl_common.h"
#include "alg_cmd_type.h"
#include "transport_pub.h"
#include "externalinput_pub.h"
#include "template_v1_utils.h"
#include "comm_utils.h"
constexpr s64 HCCL_SUB_STREAM_NUM_ZERO = 0;
constexpr s64 HCCL_SUB_STREAM_NUM_DOUBLE_RING = 1;
constexpr s64 HCCL_SUB_STREAM_NUM_4P_MESH = 2;
constexpr s64 HCCL_SUB_STREAM_NUM_8P_RING = 3;
constexpr s64 HCCL_SUB_STREAM_NP_MESH = 2;
enum class HcclAlgoType {
HCCL_ALGO_TYPE_DEFAULT = 0,
HCCL_ALGO_TYPE_RING,
HCCL_ALGO_TYPE_PIPELINE,
HCCL_ALGO_TYPE_FULLMESH,
HCCL_ALGO_TYPE_HDR,
HCCL_ALGO_TYPE_PAIRWISE,
HCCL_ALGO_TYPE_NHR,
HCCL_ALGO_TYPE_NHR_V1,
HCCL_ALGO_TYPE_NB,
HCCL_ALGO_TYPE_NULL,
HCCL_ALGO_TYPE_NA,
HCCL_ALGO_TYPE_AHC,
HCCL_ALGO_TYPE_AHC_BROKE,
};
enum class AlgTypeLevel0 {
ALG_LEVEL0_WHOLE_RING = 0,
ALG_LEVEL0_8P_RING,
ALG_LEVEL0_4P_MESH,
ALG_LEVEL0_2P_MESH,
ALG_LEVEL0_1P_MESH,
ALG_LEVEL0_4P_RING,
ALG_LEVEL0_NP_SINGLE_RING,
ALG_LEVEL0_NP_DOUBLE_RING,
ALG_LEVEL0_NP_MESH,
ALG_LEVEL0_NP_HD,
ALG_LEVEL0_NP_STAR,
ALG_LEVEL0_PAIRWISE,
ALG_LEVEL0_RESERVED
};
enum class AlgTypeLevel1 {
ALG_LEVEL1_WHOLE_RING = 0,
ALG_LEVEL1_HD,
ALG_LEVEL1_RING,
ALG_LEVEL1_PIPELINE,
ALG_LEVEL1_STAR,
ALG_LEVEL1_NHR,
ALG_LEVEL1_NHR_V1,
ALG_LEVEL1_NB,
ALG_LEVEL1_AHC,
ALG_LEVEL1_AHC_BROKE,
ALG_LEVEL1_RESERVED
};
enum class AlgTypeLevel2 {
ALG_LEVEL2_WHOLE_RING = 0,
ALG_LEVEL2_HD,
ALG_LEVEL2_RING,
ALG_LEVEL2_NHR,
ALG_LEVEL2_NB,
ALG_LEVEL2_PIPELINE,
ALG_LEVEL2_RESERVED
};
using AlgType = struct TagAlgType {
AlgTypeLevel0 algoLevel0;
AlgTypeLevel1 algoLevel1;
AlgTypeLevel2 algoLevel2;
TagAlgType() : algoLevel0(AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING), algoLevel1(AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING),
algoLevel2(AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING)
{
}
explicit TagAlgType(AlgTypeLevel0 algoLevel0) : algoLevel0(algoLevel0), algoLevel1(AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING),
algoLevel2(AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING)
{
}
TagAlgType(AlgTypeLevel0 algoLevel0, AlgTypeLevel1 algoLevel1) : algoLevel0(algoLevel0),
algoLevel1(algoLevel1), algoLevel2(AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING)
{
}
TagAlgType(AlgTypeLevel0 algoLevel0, AlgTypeLevel2 algoLevel2) : algoLevel0(algoLevel0),
algoLevel1(AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING), algoLevel2(algoLevel2)
{
}
TagAlgType(AlgTypeLevel0 algoLevel0, AlgTypeLevel1 algoLevel1, AlgTypeLevel2 algoLevel2) : algoLevel0(algoLevel0),
algoLevel1(algoLevel1), algoLevel2(algoLevel2)
{
}
explicit TagAlgType(AlgTypeLevel1 algoLevel1) : algoLevel0(AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING), algoLevel1(algoLevel1),
algoLevel2(AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING)
{
}
TagAlgType(AlgTypeLevel1 algoLevel1, AlgTypeLevel2 algoLevel2) : algoLevel0(AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING),
algoLevel1(algoLevel1), algoLevel2(algoLevel2)
{
}
explicit TagAlgType(AlgTypeLevel2 algoLevel2) : algoLevel0(AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING),
algoLevel1(AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING), algoLevel2(algoLevel2)
{
}
static TagAlgType Reserved() {
return TagAlgType(AlgTypeLevel0::ALG_LEVEL0_RESERVED, AlgTypeLevel1::ALG_LEVEL1_RESERVED, AlgTypeLevel2::ALG_LEVEL2_RESERVED);
}
TagAlgType(const TagAlgType &that) : algoLevel0(that.algoLevel0), algoLevel1(that.algoLevel1), algoLevel2(that.algoLevel2)
{
}
TagAlgType &operator=(const TagAlgType &that)
{
if (&that != this) {
algoLevel0 = that.algoLevel0;
algoLevel1 = that.algoLevel1;
algoLevel2 = that.algoLevel2;
}
return *this;
}
};
namespace hccl {
using RankInfo = struct TagRankInfo {
public:
u32 userRank{INVALID_UINT};
u32 worldRank{INVALID_UINT};
u32 localRank{INVALID_UINT};
s32 devicePhyId{-1};
DevType deviceType{DevType::DEV_TYPE_NOSOC};
std::vector<HcclIpAddress> nicIp;
std::vector<HcclIpAddress> backupNicIp;
u32 deviceNicPort{HCCL_INVALID_PORT};
u32 deviceVnicPort{HCCL_INVALID_PORT};
u32 backupDevicePort{HCCL_INVALID_PORT};
std::vector<u32> nicIdx;
NICDeployment nicDeploy{NICDeployment::NIC_DEPLOYMENT_DEVICE};
HcclIpAddress hostIp;
u32 hostPort{HCCL_INVALID_PORT};
std::string serverId{""};
u32 serverIdx{INVALID_UINT};
u32 superDeviceId{INVALID_UINT};
std::string superPodId{""};
u32 superPodIdx{INVALID_UINT};
HcclIpAddress deviceVnicIp;
};
constexpr s64 HCCL_SMALL_COUNT_128_KB = 128 * 1024;
constexpr s64 HCCL_SMALL_COUNT_GRAPH_64_KB = 64 * 1024;
constexpr s64 HCCL_MEDIUM_COUNT_GRAPH_4_MB = 4 * 1024 * 1024;
constexpr s64 HCCL_SMALL_COUNT_256_KB = 256 * 1024;
constexpr s64 HCCL_ALIGN_COUNT_32_B = 32;
constexpr s64 HCCL_SMALL_COUNT_190_KB = 190 * 1024;
constexpr s64 HCCL_SMALL_COUNT_512_KB = 512 * 1024;
constexpr s64 HCCL_SMALL_COUNT_1_MB = 1024 * 1024;
constexpr s64 HCCL_SMALL_COUNT_2_MB = 2048 * 1024;
constexpr s64 HCCL_SMALL_COUNT_4_MB = 4096 * 1024;
constexpr s64 HCCL_SMALL_COUNT_8_MB = 8192 * 1024;
constexpr s64 HCCL_SMALL_COUNT_16_KB = 16 * 1024;
constexpr s64 HCCL_MID_COUNT_16_MB = 16 * 1024 * 1024;
constexpr s64 HCCL_MID_COUNT_32_MB = 32 * 1024 * 1024;
constexpr u32 HCCL_INTER_SERVER_RING_ALGO_MAX_SUPPORT_SERVER_NUM = 8;
constexpr u32 HCCL_ALLTOALLV_P2P_SIZE = 2;
constexpr u32 HCCL_MEMSIZE_HD_FACTOR = 4;
const std::string HCCL_ALLTOALL_PARA_ALLGATHER = "AllgatherForCollectA2APara";
const std::string HCCL_MC2_MULTISERVER_SUFFIX = "_MC2MultiServer";
const std::map<AlgTypeLevel0, std::string> HCCL_ALGO_LEVEL0_NAME_MAP = {
{AlgTypeLevel0::ALG_LEVEL0_NP_DOUBLE_RING, "ring"},
{AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING, "ring"},
{AlgTypeLevel0::ALG_LEVEL0_8P_RING, "ring"},
{AlgTypeLevel0::ALG_LEVEL0_4P_MESH, "fullmesh"},
{AlgTypeLevel0::ALG_LEVEL0_2P_MESH, "fullmesh"},
{AlgTypeLevel0::ALG_LEVEL0_1P_MESH, "fullmesh"},
{AlgTypeLevel0::ALG_LEVEL0_4P_RING, "ring"},
{AlgTypeLevel0::ALG_LEVEL0_NP_SINGLE_RING, "ring"},
{AlgTypeLevel0::ALG_LEVEL0_NP_MESH, "fullmesh"},
{AlgTypeLevel0::ALG_LEVEL0_NP_HD, "HD"},
{AlgTypeLevel0::ALG_LEVEL0_NP_STAR, "star"},
{AlgTypeLevel0::ALG_LEVEL0_RESERVED, "null"},
};
const std::map<AlgTypeLevel1, std::string> HCCL_ALGO_LEVEL1_NAME_MAP = {
{AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING, "ring"},
{AlgTypeLevel1::ALG_LEVEL1_HD, "H-D"},
{AlgTypeLevel1::ALG_LEVEL1_RING, "ring"},
{AlgTypeLevel1::ALG_LEVEL1_PIPELINE, "pipeline"},
{AlgTypeLevel1::ALG_LEVEL1_NHR, "NHR"},
{AlgTypeLevel1::ALG_LEVEL1_NHR_V1, "NHR_V1"},
{AlgTypeLevel1::ALG_LEVEL1_AHC, "AHC"},
{AlgTypeLevel1::ALG_LEVEL1_AHC_BROKE, "AHC_BROKE"},
{AlgTypeLevel1::ALG_LEVEL1_NB, "NB"},
{AlgTypeLevel1::ALG_LEVEL1_RESERVED, "null"},
};
const std::map<AlgTypeLevel2, std::string> HCCL_ALGO_LEVEL2_NAME_MAP = {
{AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING, "ring"},
{AlgTypeLevel2::ALG_LEVEL2_HD, "H-D"},
{AlgTypeLevel2::ALG_LEVEL2_RING, "ring"},
{AlgTypeLevel2::ALG_LEVEL2_NHR, "NHR"},
{AlgTypeLevel2::ALG_LEVEL2_NB, "NB"},
{AlgTypeLevel2::ALG_LEVEL2_PIPELINE, "pipeline"},
{AlgTypeLevel2::ALG_LEVEL2_RESERVED, "null"},
};
const std::map<AlgTypeLevel0, std::string> HCCL_ALGO_LEVEL0_MAP = {
{AlgTypeLevel0::ALG_LEVEL0_NP_DOUBLE_RING, "RING"},
{AlgTypeLevel0::ALG_LEVEL0_WHOLE_RING, "RING"},
{AlgTypeLevel0::ALG_LEVEL0_8P_RING, "RING"},
{AlgTypeLevel0::ALG_LEVEL0_4P_MESH, "MESH"},
{AlgTypeLevel0::ALG_LEVEL0_2P_MESH, "MESH"},
{AlgTypeLevel0::ALG_LEVEL0_1P_MESH, "MESH"},
{AlgTypeLevel0::ALG_LEVEL0_4P_RING, "RING"},
{AlgTypeLevel0::ALG_LEVEL0_NP_SINGLE_RING, "RING"},
{AlgTypeLevel0::ALG_LEVEL0_NP_MESH, "MESH"},
{AlgTypeLevel0::ALG_LEVEL0_NP_HD, "HD"},
{AlgTypeLevel0::ALG_LEVEL0_NP_STAR, "STAR"},
{AlgTypeLevel0::ALG_LEVEL0_PAIRWISE, "PAIRWISE"},
{AlgTypeLevel0::ALG_LEVEL0_RESERVED, "NA"},
};
const std::map<AlgTypeLevel1, std::string> HCCL_ALGO_LEVEL1_MAP = {
{AlgTypeLevel1::ALG_LEVEL1_WHOLE_RING, "RING"},
{AlgTypeLevel1::ALG_LEVEL1_HD, "HD"},
{AlgTypeLevel1::ALG_LEVEL1_RING, "RING"},
{AlgTypeLevel1::ALG_LEVEL1_PIPELINE, "PIPELINE"},
{AlgTypeLevel1::ALG_LEVEL1_NHR, "NHR"},
{AlgTypeLevel1::ALG_LEVEL1_NHR_V1, "NHR_V1"},
{AlgTypeLevel1::ALG_LEVEL1_AHC, "AHC"},
{AlgTypeLevel1::ALG_LEVEL1_AHC_BROKE, "AHC_BROKE"},
{AlgTypeLevel1::ALG_LEVEL1_NB, "NB"},
{AlgTypeLevel1::ALG_LEVEL1_STAR, "STAR"},
{AlgTypeLevel1::ALG_LEVEL1_RESERVED, "NA"},
};
const std::map<AlgTypeLevel2, std::string> HCCL_ALGO_LEVEL2_MAP = {
{AlgTypeLevel2::ALG_LEVEL2_WHOLE_RING, "RING"},
{AlgTypeLevel2::ALG_LEVEL2_HD, "HD"},
{AlgTypeLevel2::ALG_LEVEL2_RING, "RING"},
{AlgTypeLevel2::ALG_LEVEL2_NHR, "NHR"},
{AlgTypeLevel2::ALG_LEVEL2_NB, "NB"},
{AlgTypeLevel2::ALG_LEVEL2_PIPELINE, "PIPELINE"},
{AlgTypeLevel2::ALG_LEVEL2_RESERVED, "NA"},
};
inline std::string TransferAlgType(AlgType algType)
{
std::string algTypeStr;
auto level0Iter = HCCL_ALGO_LEVEL0_MAP.find(algType.algoLevel0);
auto level1Iter = HCCL_ALGO_LEVEL1_MAP.find(algType.algoLevel1);
auto level2Iter = HCCL_ALGO_LEVEL2_MAP.find(algType.algoLevel2);
if (level0Iter == HCCL_ALGO_LEVEL0_MAP.end() || level1Iter == HCCL_ALGO_LEVEL1_MAP.end() || level2Iter == HCCL_ALGO_LEVEL2_MAP.end()) {
algTypeStr = "not found";
HCCL_WARNING("No matching algLevel0 or algLevel1 or algLevel2 is found.");
} else {
algTypeStr.append(static_cast<std::string>(level0Iter->second)).append("-").append(static_cast<std::string>(level1Iter->second))
.append("-").append(static_cast<std::string>(level2Iter->second));
HCCL_INFO("The algtype for profiling is [%s]", algTypeStr.c_str());
}
return algTypeStr;
}
inline bool TransferStrToAlgType(const std::string& algTypeStr, AlgType& algType)
{
std::vector<std::string> parts;
std::stringstream ss(algTypeStr);
std::string part;
constexpr u32 algTypeLevelNum = 3;
while (std::getline(ss, part, '-')) {
parts.push_back(part);
}
if (parts.size() != algTypeLevelNum) {
HCCL_ERROR("Invalid algType string format: %s", algTypeStr.c_str());
return false;
}
int level0Val = std::stoi(parts[0]);
int level1Val = std::stoi(parts[1]);
int level2Val = std::stoi(parts[2]);
if (level0Val >= static_cast<int>(AlgTypeLevel0::ALG_LEVEL0_RESERVED) || level0Val < 0
|| level1Val >= static_cast<int>(AlgTypeLevel1::ALG_LEVEL1_RESERVED) || level1Val < 0
|| level2Val >= static_cast<int>(AlgTypeLevel2::ALG_LEVEL2_RESERVED) || level2Val < 0)
{
HCCL_ERROR("Invalid algType string format: %s", algTypeStr.c_str());
return false;
}
algType.algoLevel0 = static_cast<AlgTypeLevel0>(level0Val);
algType.algoLevel1 = static_cast<AlgTypeLevel1>(level1Val);
algType.algoLevel2 = static_cast<AlgTypeLevel2>(level2Val);
HCCL_INFO("Successfully parsed algType from string: %s", algTypeStr.c_str());
return true;
}
}
enum class TopoType {
TOPO_TYPE_COMMON = 0,
TOPO_TYPE_8P_RING = 1,
TOPO_TYPE_4P_MESH = 2,
TOPO_TYPE_2P_MESH = 3,
TOPO_TYPE_1P_MESH = 4,
TOPO_TYPE_4P_RING = 5,
TOPO_TYPE_NP_SINGLE_RING = 6,
TOPO_TYPE_8P_MESH = 7,
TOPO_TYPE_NP_MESH = 8,
TOPO_TYPE_NP_DOUBLE_RING = 9,
TOPO_TYPE_HETEROG = 10,
TOPO_TYPE_ES_MESH = 11,
TOPO_TYPE_RESERVED
};
#endif