* Copyright (c) Huawei Technologies Co., Ltd. 2024-2025. All rights reserved.
* This program is free software, you can redistribute it and/or modify it under the terms and conditions of
* CANN Open Software License Agreement Version 2.0 (the "License").
* Please refer to the License for details. You may not use this file except in compliance with the License.
* THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND, EITHER EXPRESS OR IMPLIED,
* INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.
* See LICENSE in the root of the software repository for the full text of the License.
*/
#ifndef TORCH_ATB_ENGER_GRAPH_OPERATION_BUILDER_H
#define TORCH_ATB_ENGER_GRAPH_OPERATION_BUILDER_H
#include "atb/atb_infer.h"
#include "graph_node.h"
#include "operation_wrapper.h"
namespace TorchAtb {
/**
 * @brief Callable that derives a new shape from an existing one.
 *
 * The single argument is the old shape (one int64_t per dimension); the return
 * value is the shape to use instead. Accepted by GraphBuilder::Reshape.
 */
using ReshapeHandler = std::function<std::vector<int64_t>(const std::vector<int64_t> &)>;
class GraphBuilder {
public:
explicit GraphBuilder(const std::string &graphName);
std::string AddInput(const std::string &name);
GraphNode &AddNode(const std::vector<std::string> &inputs, atb::Operation *operation);
template <typename OpParam>
GraphNode &AddNodeByParamType(const std::vector<std::string> &inputs, const OpParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::LinearParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::LayerNormParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ElewiseParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::SoftmaxParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::SelfAttentionParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::RopeParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::SplitParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::GatherParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ActivationParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::RmsNormParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::AllGatherParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::AsStridedParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::CumsumParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::DynamicNTKParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::MultinomialParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ConcatParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::SliceParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::TransposeParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::GatingParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ReshapeAndCacheParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::FillParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::RazorFusionAttentionParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::AllReduceParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::BroadcastParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ReduceScatterParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::ReduceScatterVParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::LinearParallelParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::LinearSparseParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::RelayAttentionParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::TopkToppSamplingParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, const atb::infer::AllToAllParam ¶m);
GraphNode &AddNode(const std::vector<std::string> &inputs, OperationWrapper &opWrapper);
GraphBuilder &Reshape(const std::string &srcTensorName, const ReshapeHandler &reshapeHandler,
const std::string &reshapedTensorName);
void MarkOutput(const std::string &outTensor);
void SetExecuteStreams(const std::vector<std::uintptr_t> &executeStreams);
OperationWrapper Build();
private:
atb::GraphParam graphParam_;
std::vector<GraphNode> graphNodes_;
uint32_t internalTensorNum_ = 0;
uint32_t GetTensorId(const std::string &tensorName);
void ExecuteStreamsAssign();
std::set<uint32_t> streamIds_;
std::vector<aclrtStream> executeStreams_;
std::map<std::string, uint32_t> inTensorIds_;
std::map<std::string, uint32_t> outTensorIds_;
std::map<std::string, uint32_t> internalTensorIds_;
std::map<std::string, std::pair<std::string, atb::ReshapeFunc>> reshapedTensorIds_;
};
}
#endif