01_simd_cpp_api/05_best_practices/03_fusion_compute/quant_group_matmul_high_performance
01_simd_cpp_api/02_features/05_aclrtc/rtc_hello_world
01_simd_cpp_api/02_features/05_aclrtc/rtc_template_add
01_simd_cpp_api/00_introduction/00_quickstart/hello_world
02_simd_c_api/02_features/03_c_api/00_vector_compute/02_c_api_delicacy_async_add
02_simd_c_api/02_features/03_c_api/00_vector_compute/01_async_add
02_simd_c_api/00_introduction/01_add/c_api_delicacy_async_add
02_simd_c_api/00_introduction/01_add/c_api_async_add
02_simd_c_api/00_introduction/01_add/c_api_sync_add
02_simd_c_api/02_features/03_c_api/00_vector_compute/00_sync_add
01_simd_cpp_api/02_features/00_framework/00_pytorch/pybind
01_simd_cpp_api/02_features/00_framework/00_pytorch/ge_torchair
02_simd_c_api/00_introduction/00_quickstart/hello_world_npu
04_aicpu/00_introduction/00_device_tiling/aicpu_device_tiling
01_simd_cpp_api/03_basic_api/05_sync_control/group_barrier
01_simd_cpp_api/04_advanced_api/10_math/log
01_simd_cpp_api/06_compatibility_guide/fill
01_simd_cpp_api/06_compatibility_guide/scatter
01_simd_cpp_api/03_basic_api/09_utils/gm_by_pass_dcache
01_simd_cpp_api/03_basic_api/03_matrix_compute/mmad_unitflag
01_simd_cpp_api/03_basic_api/05_sync_control/task_sync
01_simd_cpp_api/06_compatibility_guide/data_copy_l1togm
01_simd_cpp_api/03_basic_api/00_data_movement/copy_ub2ub
01_simd_cpp_api/01_utilities/04_profiling/torch_library_report_tensor
01_simd_cpp_api/03_basic_api/06_atomic/data_movement_with_atomic_operations
01_simd_cpp_api/03_basic_api/05_sync_control/data_sync_barrier
01_simd_cpp_api/01_utilities/04_profiling/msprof
01_simd_cpp_api/03_basic_api/03_matrix_compute/mmad
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/duplicate
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/reduce_pair_elem
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/cast
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/element_wise_compound_compute
01_simd_cpp_api/03_basic_api/03_matrix_compute/fixpipe_l0c2gm
01_simd_cpp_api/03_basic_api/00_data_movement/data_copy_gm2ub_slice
01_simd_cpp_api/03_basic_api/05_sync_control/sync_all
01_simd_cpp_api/02_features/00_framework/00_pytorch/torch_library
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/element_wise_logic
01_simd_cpp_api/03_basic_api/00_data_movement/data_copy_gm2l1
01_simd_cpp_api/00_introduction/02_matrix/matmul_basic_api
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/element_wise_arithmetic
01_simd_cpp_api/06_compatibility_guide/pattern_transformation
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/reduce_data_block
01_simd_cpp_api/03_basic_api/07_tpipe_tque/tpipe_reuse
01_simd_cpp_api/03_basic_api/00_data_movement/data_copy_pad_gm2ub_ub2gm
01_simd_cpp_api/03_basic_api/05_sync_control/sequential_block_sync
01_simd_cpp_api/03_basic_api/03_matrix_compute/load_data_l12l0
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/transpose
01_simd_cpp_api/04_advanced_api/11_utils/type_traits
01_simd_cpp_api/00_introduction/01_add/add
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/brcb
01_simd_cpp_api/03_basic_api/03_matrix_compute/mmad_gemv
01_simd_cpp_api/06_compatibility_guide/set_loaddata_boundary
01_simd_cpp_api/03_basic_api/04_memory_management/tmp_buffer
01_simd_cpp_api/00_introduction/01_add/add_tpipe_tque
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/compare
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/create_vec_index
01_simd_cpp_api/03_basic_api/05_sync_control/ib_set_wait
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/select
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/gather
01_simd_cpp_api/02_features/99_acl_based/00_acl_compilation/custom_op_static_lib
01_simd_cpp_api/02_features/99_acl_based/00_acl_compilation/parallel_ops_package
01_simd_cpp_api/00_introduction/03_fusion_operation/matmul_leakyrelu_basic_api
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/mrg_sort
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/reduce_computation
01_simd_cpp_api/03_basic_api/03_matrix_compute/mmad_load3dv2
01_simd_cpp_api/04_advanced_api/10_math/erf
01_simd_cpp_api/03_basic_api/03_matrix_compute/fixpipe_l0c2l1
01_simd_cpp_api/03_basic_api/03_matrix_compute/mmad_with_sparse
01_simd_cpp_api/04_advanced_api/04_reduce/reduce
01_simd_cpp_api/01_utilities/01_assert
01_simd_cpp_api/04_advanced_api/08_transpose/fill
01_simd_cpp_api/03_basic_api/01_memory_vector_compute/reduce_repeat
01_simd_cpp_api/04_advanced_api/02_normalization/rmsnorm
01_simd_cpp_api/03_basic_api/04_memory_management/tbufpool_management
01_simd_cpp_api/01_utilities/05_sanitizer/ms_sanitizer
01_simd_cpp_api/03_basic_api/03_matrix_compute/batch_matmul
01_simd_cpp_api/03_basic_api/05_sync_control/cross_core_set_wait_flag
01_simd_cpp_api/01_utilities/00_printf/simple_printf
01_simd_cpp_api/05_best_practices/04_memory_access/bank_conflict_nd2nz
01_simd_cpp_api/03_basic_api/06_atomic/set_atomic_deterministic_computation
01_simd_cpp_api/01_utilities/02_dump/simple_dump
01_simd_cpp_api/03_basic_api/07_tpipe_tque/get_tpipe_ptr
01_simd_cpp_api/03_basic_api/00_data_movement/data_copy_l0c2gm
01_simd_cpp_api/05_best_practices/01_matrix_compute/matmul_high_performance
01_simd_cpp_api/03_basic_api/04_memory_management/list_tensor_desc_input
01_simd_cpp_api/05_best_practices/04_memory_access/data_copy
01_simd_cpp_api/05_best_practices/00_vector_compute/add_high_performance
01_simd_cpp_api/04_advanced_api/04_reduce/sum
01_simd_cpp_api/06_compatibility_guide/matmul_s4
01_simd_cpp_api/04_advanced_api/10_math/ceil
01_simd_cpp_api/04_advanced_api/08_transpose/unpad
01_simd_cpp_api/04_advanced_api/01_activation/swiglu
01_simd_cpp_api/04_advanced_api/01_activation/gelu
01_simd_cpp_api/04_advanced_api/03_quantization/dequant
01_simd_cpp_api/04_advanced_api/07_filter/dropout
01_simd_cpp_api/02_features/99_acl_based/00_acl_compilation/custom_op
01_simd_cpp_api/04_advanced_api/10_math/exp
01_simd_cpp_api/04_advanced_api/08_transpose/broadcast
01_simd_cpp_api/04_advanced_api/01_activation/swish
01_simd_cpp_api/04_advanced_api/10_math/clampmin
01_simd_cpp_api/04_advanced_api/10_math/axpy_half_float
01_simd_cpp_api/04_advanced_api/06_index/arange
01_simd_cpp_api/04_advanced_api/10_math/xor
01_simd_cpp_api/04_advanced_api/03_quantization/quant
01_simd_cpp_api/04_advanced_api/03_quantization/antiquant
01_simd_cpp_api/04_advanced_api/04_reduce/reducemax
01_simd_cpp_api/04_advanced_api/08_transpose/transdata
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_sparse
01_simd_cpp_api/04_advanced_api/10_math/fmod
01_simd_cpp_api/04_advanced_api/01_activation/geglu
01_simd_cpp_api/04_advanced_api/10_math/acosh
01_simd_cpp_api/04_advanced_api/07_filter/select
04_aicpu/02_features/00_framwork/00_pytorch/tiling_sink_programming
01_simd_cpp_api/02_features/99_acl_based/01_acl_invocation/aclnn_invocation
01_simd_cpp_api/02_features/00_framework/02_onnx/onnx_plugin
01_simd_cpp_api/02_features/00_framework/03_ge/triple_chevron_notation
01_simd_cpp_api/02_features/00_framework/01_tensorflow/tensorflow_builtin
01_simd_cpp_api/02_features/00_framework/01_tensorflow/tensorflow_custom
01_simd_cpp_api/02_features/99_acl_based/01_acl_invocation/aclop_invocation
01_simd_cpp_api/04_advanced_api/05_sort/sort
01_simd_cpp_api/04_advanced_api/02_normalization/layernorm_v2
01_simd_cpp_api/04_advanced_api/02_normalization/deepnorm
01_simd_cpp_api/04_advanced_api/08_transpose/pad
01_simd_cpp_api/04_advanced_api/05_sort/topk
01_simd_cpp_api/04_advanced_api/01_activation/logsoftmax
01_simd_cpp_api/04_advanced_api/02_normalization/welford
01_simd_cpp_api/04_advanced_api/00_matmul/matmul
01_simd_cpp_api/04_advanced_api/01_activation/softmaxgrad
01_simd_cpp_api/04_advanced_api/08_transpose/transpose
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_multi_core_unaligned
01_simd_cpp_api/04_advanced_api/01_activation/softmaxflashv3
01_simd_cpp_api/00_introduction/02_matrix/matmul_advanced_api
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_constant_tiling
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_tscm
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_l0cache
01_simd_cpp_api/04_advanced_api/02_normalization/layernorm
01_simd_cpp_api/04_advanced_api/01_activation/softmax
01_simd_cpp_api/05_best_practices/03_fusion_compute/matmul_gelu_high_performance
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_callback
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_channelsplit_output
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_format_gemv
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_splitk
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_mixdualmaster
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_co1_output
01_simd_cpp_api/04_advanced_api/08_transpose/add_broadcast
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_format_nd_align
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_mn_double_buffer
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_nbuffer33
01_simd_cpp_api/04_advanced_api/01_activation/softmaxflashv2
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_triangle
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_fused_manual
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_preload
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_unitflag
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_a2b2_share
01_simd_cpp_api/04_advanced_api/00_matmul/batch_matmul
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_async_iterate_all
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_int4
01_simd_cpp_api/05_best_practices/01_matrix_compute/matmul_basic_api_high_performance
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_fused
01_simd_cpp_api/04_advanced_api/00_matmul/batch_matmul_bias_reuse
01_simd_cpp_api/00_introduction/03_fusion_operation/matmul_leakyrelu_advanced_api
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_ibshareB
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_partial_output
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_async_iterate
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_ibshareAB
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_k_reorder_load
01_simd_cpp_api/04_advanced_api/00_matmul/batch_matmul_iterate_n_batch
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_l2cache
01_simd_cpp_api/04_advanced_api/00_matmul/matmul_quant
01_simd_cpp_api/04_advanced_api/10_math/frac
01_simd_cpp_api/04_advanced_api/10_math/cumsum
01_simd_cpp_api/04_advanced_api/10_math/power
01_simd_cpp_api/04_advanced_api/01_activation/sigmoid