{
"torch_npu":
{
"v2.1": [],
"v2.5": [],
"v2.6": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward"
],
"v2.7": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.8": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.9": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.10": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.11": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.12": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"v2.13": [
"npu_gelu_mul",
"npu_clipped_swiglu",
"npu_sim_exponential_",
"npu_fused_floyd_attention",
"npu_fused_floyd_attention_backward",
"npu_fused_causal_conv1d",
"npu_masked_causal_conv1d",
"npu_masked_causal_conv1d_backward",
"npu_apply_rotary_pos_emb",
"npu_ring_attention_update"
],
"all_version": [
"_npu_dropout",
"copy_memory_",
"empty_with_format",
"empty_with_swapped_memory",
"npu_alloc_float_status",
"npu_apply_adam",
"npu_advance_step_flashattn",
"npu_batch_gather_matmul",
"npu_batch_gather_matmul_",
"npu_block_sparse_attention",
"npu_block_sparse_attention_backward",
"npu_bert_apply_adam",
"npu_clear_float_status",
"npu_cross_entropy_loss",
"npu_format_cast_",
"npu_fusion_attention",
"npu_fusion_attention_v3",
"npu_get_float_status",
"npu_nms_rotated",
"npu_random_choice_with_mask",
"npu_rms_norm",
"npu_add_rms_norm_cast",
"npu_moe_compute_expert_tokens",
"npu_fused_infer_attention_score",
"npu_mla_prolog",
"npu_mla_prolog_v2",
"npu_mla_prolog_v3",
"npu_mla_prolog_v3_functional",
"npu_matmul_compress_dequant",
"npu_quant_lightning_indexer",
"npu_lightning_indexer",
"npu_sparse_flash_attention",
"npu_lightning_indexer_grad",
"npu_sparse_flash_attention_grad",
"npu_sparse_lightning_indexer_grad_kl_loss",
"npu_kv_quant_sparse_flash_attention",
"npu_convert_weight_to_int4pack",
"npu_ffn",
"npu_geglu",
"npu_grouped_matmul",
"npu_moe_finalize_routing",
"npu_mhc_sinkhorn",
"npu_mhc_sinkhorn_backward",
"npu_quant_matmul",
"npu_quant_matmul_reduce_sum",
"npu_quant_scatter",
"npu_quantize",
"npu_dequant_bias",
"npu_group_quant",
"npu_dynamic_quant",
"npu_dynamic_quant_asymmetric",
"npu_scatter_nd_update_",
"npu_scatter_pa_kv_cache",
"npu_stride_copy",
"npu_gemma_rms_norm",
"npu_dequant_swiglu_quant",
"npu_swiglu",
"npu_gelu",
"npu_gelu_backward",
"npu_all_gather_base_mm",
"npu_mm_reduce_scatter_base",
"npu_prefetch",
"npu_quant_scatter_",
"npu_trans_quant_param",
"npu_top_k_top_p_sample",
"scatter_update",
"scatter_update_",
"npu_kronecker_quant",
"npu_group_norm_swish",
"npu_mrope",
"npu_grouped_matmul_finalize_routing",
"npu_grouped_matmul_swiglu_quant_v2",
"npu_recurrent_gated_delta_rule",
"npu_recurrent_gated_delta_rule_functional",
"npu_alltoallv_gmm",
"npu_alltoallv_quant_gmm",
"npu_gmm_alltoallv",
"npu_quant_gmm_alltoallv",
"npu_nsa_compress",
"npu_nsa_compress_infer",
"npu_nsa_compress_attention",
"npu_nsa_compress_attention_infer",
"npu_nsa_select_attention",
"npu_nsa_select_attention_infer",
"npu_transpose_batchmatmul",
"npu_transpose_quant_batchmatmul",
"npu_gather_sparse_index",
"npu_moe_distribute_combine_add_rms_norm",
"npu_moe_update_expert",
"npu_dynamic_block_quant",
"attention_worker_scheduler_",
"attention_worker_scheduler",
"ffn_worker_scheduler_",
"ffn_worker_scheduler",
"npu_moe_gating_top_k_softmax_v2",
"npu_moe_gating_top_k_backward",
"npu_confusion_transpose",
"npu_dense_lightning_indexer_grad_kl_loss",
"npu_dense_lightning_indexer_softmax_lse",
"npu_one_hot",
"npu_quant_matmul_gelu",
"npu_mhc_post",
"npu_mhc_post_backward",
"npu_mhc_pre",
"npu_chunk_gated_delta_rule",
"npu_rotate_quant",
"npu_mhc_pre_backward",
"npu_quant_max"
]
}
}