---
# Quantization recipe "wan2_2_w8a8f8_mxfp_i2v": 8-bit weights and activations
# (MXFP8 linear layers) plus FP8 attention quantization, for the "i2v-A14B"
# task.
# NOTE(review): the nesting in this file was reconstructed from key order;
# confirm it against the consuming tool's schema.
apiversion: multimodal_sd_modelslim_v1

metadata:
  config_id: wan2_2_w8a8f8_mxfp_i2v
  score: 90
  # Model name -> list of tag combinations; a single two-tag combination here.
  # NOTE(review): assumes both tags belong to the same inner list - confirm.
  verified_tags:
    Wan2.2-I2V-A14B:
      - - MindIE-SD
        - Atlas_350
  label:
    w_bit: 8
    a_bit: 8
    is_sparse: false
    fa_quant: true

spec:
  # Processing steps, listed as: linear_quant, online_quarot, fa3_quant.
  process:
    # MXFP8, per-block, symmetric, min-max for both activations and weights.
    - type: "linear_quant"
      qconfig:
        act:
          scope: "per_block"
          dtype: "mxfp8"
          symmetric: true
          method: "minmax"
        weight:
          scope: "per_block"
          dtype: "mxfp8"
          symmetric: true
          method: "minmax"
      # Must stay quoted: a bare * would be parsed as a YAML alias.
      include:
        - "*"
    # Restricted to names matching the self-attention pattern below.
    - type: "online_quarot"
      include:
        - "*.self_attn.*"
    # fp8_e4m3, per-token, symmetric, min-max.
    - type: "fa3_quant"
      qconfig:
        dtype: "fp8_e4m3"
        scope: "per_token"
        symmetric: true
        method: "minmax"
      include:
        - "*self_attn"
  # NOTE(review): presumably the calibration dataset name; assumed to sit at
  # spec level rather than inside the fa3_quant step - confirm.
  dataset: wan2_2_i2v
  save:
    - type: "mindie_format_saver"
      part_file_size: 0
  multimodal_sd_config:
    dump_config:
      enable_dump: false
      capture_mode: "args"
      dump_data_dir: ""
    # NOTE(review): assumed to be a sibling of dump_config - confirm.
    inference_config:
      # Quoted so the value stays a string.
      size: "1280*720"
      frame_num: 81
      sample_steps: 40
      convert_model_dtype: true
      task: "i2v-A14B"