{
"type": "text",
"name": "qwen3-vl-2b-prefill",
"description": "Qwen3-VL-2B prefill, 1 query, qlen=27, img=1080x1920, compile",
"initial_time_s": 0.116223,
"baseline_time_s": 0.057731,
"initial_tolerance": 0.1,
"baseline_tolerance": 1.02,
"operator_top_n": 10,
"operator_tolerance": 0.1,
"user_input": {
"device": "ATLAS_800_A2_376T_64G",
"model_id": "Qwen/Qwen3-VL-2B-Instruct",
"num_queries": 1,
"query_len": 27,
"context_length": 0,
"prefix_cache_hit_rate": 0.0,
"do_compile": true,
"allow_graph_break": false,
"enable_multistream": true,
"dump_input_shapes": false,
"chrome_trace": null,
"graph_log_url": null,
"log_level": null,
"quantize_linear_action": "DISABLED",
"quantize_lmhead": false,
"mxfp4_group_size": 32,
"quantize_attention_action": "DISABLED",
"enable_sequence_parallel": false,
"decode": false,
"num_mtp_tokens": 0,
"mtp_acceptance_rate": [
0.9,
0.6,
0.4,
0.2
],
"num_hidden_layers_override": 0,
"disable_repetition": false,
"reserved_memory_gb": 0,
"world_size": 1,
"tp_size": 1,
"pp_size": 1,
"dp_size": null,
"o_proj_tp_size": null,
"o_proj_dp_size": null,
"mlp_tp_size": null,
"mlp_dp_size": null,
"lmhead_tp_size": null,
"lmhead_dp_size": null,
"ep_size": 1,
"moe_dp_size": 1,
"moe_tp_size": null,
"word_embedding_tp": null,
"enable_redundant_experts": false,
"enable_shared_expert_tp": false,
"enable_dispatch_ffn_combine": false,
"enable_external_shared_experts": false,
"host_external_shared_experts": false,
"block_size": 128,
"remote_source": "huggingface",
"image_batch_size": 1,
"image_height": 1080,
"image_width": 1920,
"performance_model": [
"analytic"
],
"profiling_database": null
},
"operators": [
{
"name": "tensor_cast.attention.default",
"total_time_s": 0.035999,
"num_calls": 52
},
{
"name": "aten.mm.default",
"total_time_s": 0.023312000000000003,
"num_calls": 113
},
{
"name": "aten.addmm.default",
"total_time_s": 0.020806,
"num_calls": 104
},
{
"name": "aten.add.Tensor",
"total_time_s": 0.007976,
"num_calls": 136
},
{
"name": "aten.mul.Tensor",
"total_time_s": 0.006611,
"num_calls": 107
},
{
"name": "aten._to_copy.default",
"total_time_s": 0.0047599999999999995,
"num_calls": 100
},
{
"name": "aten.cat.default",
"total_time_s": 0.003983,
"num_calls": 74
},
{
"name": "aten.gelu.default",
"total_time_s": 0.003222,
"num_calls": 28
},
{
"name": "tensor_cast.swiglu.default",
"total_time_s": 0.002079,
"num_calls": 28
},
{
"name": "aten.native_layer_norm.default",
"total_time_s": 0.0017540000000000001,
"num_calls": 52
}
]
}