# Sharding / wrapping options consumed by the training launcher.
# NOTE(review): several key names (backward_prefetch, forward_prefetch,
# limit_all_gathers, ignored_modules) resemble PyTorch FSDP options;
# confirm the exact semantics against the code that loads this file.

# NOTE(review): presumably the size of the ZeRO-3 style shard group
# (number of ranks parameters are sharded across) — confirm.
zero3_size: 8

# Dotted import path(s) of the transformer block(s) this config targets.
# NOTE(review): likely used as the per-layer wrapping unit — confirm.
transformer_layers:
  - mindspeed_mm.models.predictor.dits.wan_dit.WanDiTBlock

# Prefetch / all-gather scheduling knobs.
backward_prefetch: 'BACKWARD_PRE'
forward_prefetch: true
limit_all_gathers: true

# Precision settings, kept as quoted strings so they are never retyped.
# NOTE(review): presumably bf16 for parameters and fp32 for gradient
# reduction — confirm how the loader maps these names to dtypes.
param_dtype: 'bf16'
reduce_dtype: 'fp32'

# Sub-module names listed as ignored.
# NOTE(review): presumably excluded from sharding; "ae" looks like the
# autoencoder — verify against the model definition.
ignored_modules:
  - ae
  - text_encoder