MindSpeed-MM/examples/diffusers/sd3/patch_sd3.py-代码预览-MindSpeed-MM:基于昇腾芯片的多模态大模型训练套件项目 - AtomGit

e3fc92f6创建于 2024年12月18日历史提交
#!/usr/bin/env python
# coding=utf-8
# Copyright 2024 The HuggingFace Inc. team. All rights reserved.
# Copyright 2024 Huawei Technologies Co., Ltd
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


import torch
from diffusers import StableDiffusion3Pipeline
from peft.utils import get_peft_model_state_dict


# Save Lora weights for checkpointing steps
def create_save_model_hook(
    accelerator,
    unwrap_model,
    transformer,
    text_encoder_one,
    text_encoder_two,
    args,
    weight_dtype,
):
    def save_model_hook(models, weights, output_dir):
        if accelerator.is_main_process:
            transformer_lora_layers_to_save = None
            text_encoder_one_lora_layers_to_save = None
            text_encoder_two_lora_layers_to_save = None

            for model in models:
                if isinstance(unwrap_model(model), type(unwrap_model(transformer))):
                    transformer_model = unwrap_model(model)
                    if args.upcast_before_saving:
                        transformer_model = transformer_model.to(torch.float32)
                    else:
                        transformer_model = transformer_model.to(weight_dtype)
                    transformer_lora_layers_to_save = get_peft_model_state_dict(
                        transformer_model
                    )

                elif (
                    isinstance(
                        unwrap_model(model), type(unwrap_model(text_encoder_one))
                    )
                    and args.train_text_encoder
                ):
                    # both text encoders are of the same class
                    hidden_size = unwrap_model(model).config.hidden_size
                    if hidden_size == 768:
                        text_encoder_one_lora_layers_to_save = (
                            get_peft_model_state_dict(model.to(torch.float32))
                        )
                    elif hidden_size == 1280:
                        text_encoder_two_lora_layers_to_save = (
                            get_peft_model_state_dict(model.to(torch.float32))
                        )

                elif (
                    isinstance(
                        unwrap_model(model), type(unwrap_model(text_encoder_one))
                    )
                    and not args.train_text_encoder
                ):
                    text_encoder_one_lora_layers_to_save = None
                    text_encoder_two_lora_layers_to_save = None

                else:
                    raise ValueError(f"unexpected save model: {model.__class__}")

                # make sure to pop weight so that corresponding model is not saved again
                if weights:
                    weights.pop()

            StableDiffusion3Pipeline.save_lora_weights(
                output_dir,
                transformer_lora_layers=transformer_lora_layers_to_save,
                text_encoder_lora_layers=text_encoder_one_lora_layers_to_save,
                text_encoder_2_lora_layers=text_encoder_two_lora_layers_to_save,
            )

    return save_model_hook