# Copyright(C) 2024. Huawei Technologies Co.,Ltd. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from argparse import ArgumentParser
from auto_optimizer import OnnxGraph
def main():
# 根据前人的模型处理经验,Decoder需要在ONNXSIM之后关闭一个融合算子。
# 经测试,生成的onnx可以atc转出om模型,精度对齐。
parser = ArgumentParser()
parser.add_argument("--onnx", type=str, required=True)
args = parser.parse_args()
graph = OnnxGraph.parse(args.onnx)
graph.remove("/decoder/Clip")
gather = graph["/decoder/embedding/Gather"]
gather.inputs[1] = "y"
graph.update_map()
graph.infershape()
g_sim = graph.simplify()
save_path = args.onnx.replace(".onnx", "_modified.onnx")
g_sim.save(save_path)
print("Modified model saved to ", save_path)
if __name__ == "__main__":
main()