* Copyright (c) Huawei Technologies Co., Ltd. 2025. All rights reserved.
* MindIE is licensed under Mulan PSL v2.
* You can use this software according to the terms and conditions of the Mulan PSL v2.
* You may obtain a copy of Mulan PSL v2 at:
* http://license.coscl.org.cn/MulanPSL2
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
* EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
* MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
* See the Mulan PSL v2 for more details.
*/
#ifndef COMMUNICATOR_H
#define COMMUNICATOR_H
#include <atomic>
#include <thread>
#include "grpc_communicator.h"
#include "ipc_communicator.h"
namespace mindie_llm {
using SlaveModelInitReqHandler = std::function<bool(std::map<std::string, std::string> &)>;
class Communicator {
public:
Communicator(std::unordered_map<std::string, std::string> &config, bool isMultiNodesInfer, int dpRankIdx,
int remoteDPRankIdx, bool intraNodeTP);
~Communicator();
bool InitIPCCommunicators(const std::string &sharedMemPrefix, uint32_t localWorldSize);
bool InitGRPCCommunicator(std::unordered_map<std::string, std::string> &config,
ResponseHandler responseFromSlaveHandler, uint32_t grpcCommunicatorNum);
void RegisterModelInitReqHandler(SlaveModelInitReqHandler handler);
bool SendModelInitRequestAndReceive(ExecuteRequest &request, std::vector<ExecuteResponse> &responses);
bool SendSharedSyncRequest(ExecuteRequest &request);
bool SendSharedSyncRequestAndReceive(ExecuteRequest &request, std::vector<ExecuteResponse> &responses);
bool SendRecoverCommandRequestAndReceive(ExecuteRequest &request, std::vector<ExecuteResponse> &responses);
bool LaunchIPCHandleResponseThreads(ResponseHandler handler);
bool SendAsyncRequest(ExecuteRequest &request);
bool SendAsyncRequestToRemote(ExecuteRequest &request);
bool GRPCGetSyncResponse(ExecuteResponse &response);
bool SendAsyncReponseToRemote(ExecuteResponse &response);
void CleanUp();
private:
bool LwdGRPCCommunicatorInit(std::unordered_map<std::string, std::string> &config, uint32_t grpcCommunicatorNum);
std::unique_ptr<IPCCommunicator> InitSingleIPCCommunicator(const std::string &sharedMemName,
const SemaphoreConfig &semConfig,
const ShmSizeConfig &shmSizeConfig,
bool receiveAllRank = false) const;
bool RegisterAndStartIPCHandler(std::shared_ptr<IPCCommunicator> ipcCommunicator, ResponseHandler handler) const;
bool SlaveNodeGRPCRequestHandler(ExecuteRequest &request);
bool SlaveNodeGRPCRecoverRequestHandler(ExecuteRequest &request);
ExecuteResponse AggregateToOneResponse(const std::vector<ExecuteResponse> &responses);
bool SlaveNodeIPCResponseHandler(ExecuteResponse &response);
bool SendAsyncRequestToLocal(ExecuteRequest &request);
bool ReceiveSyncResponsesFromRemote(std::vector<ExecuteResponse> &responses);
bool isMultiNodesInfer_;
bool layerwiseDisaggregated_{false};
bool isLwdMultiNodesInfer_{false};
MasterSlaveRole msRole_;
uint32_t numExpectedResponses_{0};
int dpRankIdx_;
int remoteDPRankIdx_;
bool intraNodeTP_;
std::string remoteSlaveIP_;
SlaveModelInitReqHandler slaveModelInitReqHandler_;
std::shared_ptr<GRPCCommunicator> grpcCommunicator_;
std::shared_ptr<IPCCommunicator> ipcCommunicatorExecute_;
std::shared_ptr<IPCCommunicator> ipcCommunicatorSharedSync_;
std::shared_ptr<IPCCommunicator> ipcCommunicatorKVTransfer_;
std::shared_ptr<IPCCommunicator> ipcCommunicatorExecuteError_;
std::shared_ptr<IPCCommunicator> ipcCommunicatorRecoverCommand_;
std::unique_ptr<std::thread> handleExecuteErrorThread_{nullptr};
};
}
#endif