{
  "torch_npu":
  {
    "v2.1": [],
    "v2.5": [],
    "v2.6": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward"
    ],
    "v2.7": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.8": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.9": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.10": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.11": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.12": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "v2.13": [
      "npu_gelu_mul",
      "npu_clipped_swiglu",
      "npu_sim_exponential_",
      "npu_fused_floyd_attention",
      "npu_fused_floyd_attention_backward",
      "npu_fused_causal_conv1d",
      "npu_masked_causal_conv1d",
      "npu_masked_causal_conv1d_backward",
      "npu_apply_rotary_pos_emb",
      "npu_ring_attention_update"
    ],
    "all_version": [
      "_npu_dropout",
      "copy_memory_",
      "empty_with_format",
      "empty_with_swapped_memory",
      "npu_alloc_float_status",
      "npu_apply_adam",
      "npu_advance_step_flashattn",
      "npu_batch_gather_matmul",
      "npu_batch_gather_matmul_",
      "npu_block_sparse_attention",
      "npu_block_sparse_attention_backward",
      "npu_bert_apply_adam",
      "npu_clear_float_status",
      "npu_cross_entropy_loss",
      "npu_format_cast_",
      "npu_fusion_attention",
      "npu_fusion_attention_v3",
      "npu_get_float_status",
      "npu_nms_rotated",
      "npu_random_choice_with_mask",
      "npu_rms_norm",
      "npu_add_rms_norm_cast",
      "npu_moe_compute_expert_tokens",
      "npu_fused_infer_attention_score",
      "npu_mla_prolog",
      "npu_mla_prolog_v2",
      "npu_mla_prolog_v3",
      "npu_mla_prolog_v3_functional",
      "npu_matmul_compress_dequant",
      "npu_quant_lightning_indexer",
      "npu_lightning_indexer",
      "npu_sparse_flash_attention",
      "npu_lightning_indexer_grad",
      "npu_sparse_flash_attention_grad",
      "npu_sparse_lightning_indexer_grad_kl_loss",
      "npu_kv_quant_sparse_flash_attention",
      "npu_convert_weight_to_int4pack",
      "npu_ffn",
      "npu_geglu",
      "npu_grouped_matmul",
      "npu_moe_finalize_routing",
      "npu_mhc_sinkhorn",
      "npu_mhc_sinkhorn_backward",
      "npu_quant_matmul",
      "npu_quant_matmul_reduce_sum",
      "npu_quant_scatter",
      "npu_quantize",
      "npu_dequant_bias",
      "npu_group_quant",
      "npu_dynamic_quant",
      "npu_dynamic_quant_asymmetric",
      "npu_scatter_nd_update_",
      "npu_scatter_pa_kv_cache",
      "npu_stride_copy",
      "npu_gemma_rms_norm",
      "npu_dequant_swiglu_quant",
      "npu_swiglu",
      "npu_gelu",
      "npu_gelu_backward",
      "npu_all_gather_base_mm",
      "npu_mm_reduce_scatter_base",
      "npu_prefetch",
      "npu_quant_scatter_",
      "npu_trans_quant_param",
      "npu_top_k_top_p_sample",
      "scatter_update",
      "scatter_update_",
      "npu_kronecker_quant",
      "npu_group_norm_swish",
      "npu_mrope",
      "npu_grouped_matmul_finalize_routing",
      "npu_grouped_matmul_swiglu_quant_v2",
      "npu_recurrent_gated_delta_rule",
      "npu_recurrent_gated_delta_rule_functional",
      "npu_alltoallv_gmm",
      "npu_alltoallv_quant_gmm",
      "npu_gmm_alltoallv",
      "npu_quant_gmm_alltoallv",
      "npu_nsa_compress",
      "npu_nsa_compress_infer",
      "npu_nsa_compress_attention",
      "npu_nsa_compress_attention_infer",
      "npu_nsa_select_attention",
      "npu_nsa_select_attention_infer",
      "npu_transpose_batchmatmul",
      "npu_transpose_quant_batchmatmul",
      "npu_gather_sparse_index",
      "npu_moe_distribute_combine_add_rms_norm",
      "npu_moe_update_expert",
      "npu_dynamic_block_quant",
      "attention_worker_scheduler_",
      "attention_worker_scheduler",
      "ffn_worker_scheduler_",
      "ffn_worker_scheduler",
      "npu_moe_gating_top_k_softmax_v2",
      "npu_moe_gating_top_k_backward",
      "npu_confusion_transpose",
      "npu_dense_lightning_indexer_grad_kl_loss",
      "npu_dense_lightning_indexer_softmax_lse",
      "npu_one_hot",
      "npu_quant_matmul_gelu",
      "npu_mhc_post",
      "npu_mhc_post_backward",
      "npu_mhc_pre",
      "npu_chunk_gated_delta_rule",
      "npu_rotate_quant",
      "npu_mhc_pre_backward",
      "npu_quant_max"
    ]
  }

}