"""Tests of Checkpoint"""
import sys
import os
import shutil
from pathlib import Path
import logging
import re
import math
import pytest
from mindspeed_llm import megatron_adaptor
from tests.test_tools.utils import create_testconfig, weight_compare, run_cmd, weight_compare_hash
BASE_DIR = Path(__file__).absolute().parents[3]
CKPT_PYPATH = os.path.join(BASE_DIR, "convert_ckpt.py")
CKPTV2_PYPATH = os.path.join(BASE_DIR, "convert_ckpt_v2.py")
class TestCheckpoint(object):
test_config = create_testconfig(Path(__file__).with_suffix(".json"))
test_config_cmd = create_testconfig(Path(__file__).with_suffix(".json"), cmd=True)
def test_deepseek3_hf2mcore_tp2pp2vpp1ep2nooplayer(self):
os.environ["CUDA_DEVICE_MAX_CONNECTIONS"] = "1"
exit_code = run_cmd(["python3", CKPTV2_PYPATH] + self.test_config_cmd['test_deepseek3_hf2mcore_tp2pp2vpp1ep2nooplayer'])
assert exit_code == 0
base_hash = self.test_config['test_deepseek3_hf2mcore_tp2pp2vpp1ep2nooplayer'][1]
save_dir = self.test_config['test_deepseek3_hf2mcore_tp2pp2vpp1ep2nooplayer'][0]['save-dir']
assert weight_compare_hash(save_dir, base_hash, "pt")
shutil.rmtree(save_dir)
def test_deepseek2_hf2mcore_tp1pp4ep8(self):
os.environ["CUDA_DEVICE_MAX_CONNECTIONS"] = "1"
exit_code = run_cmd(["python3", CKPT_PYPATH] + self.test_config_cmd['test_deepseek2_hf2mcore_tp1pp4ep8'])
assert exit_code == 0
base_dir = '/data/ci/models/deepseek2/mg/deepseek2-mla_tp-l8-t1p4e8-gemm_new'
save_dir = self.test_config['test_deepseek2_hf2mcore_tp1pp4ep8'][0]['save-dir']
assert weight_compare(base_dir, save_dir)
shutil.rmtree(save_dir)
def test_deepseek2_mcore2hf_tp1pp4ep8(self):
os.environ["CUDA_DEVICE_MAX_CONNECTIONS"] = "1"
exit_code = run_cmd(["python3", CKPT_PYPATH] + self.test_config_cmd['test_deepseek2_mcore2hf_tp1pp4ep8'])
assert exit_code == 0
base_dir = '/data/ci/models/deepseek-v2/hf/deepseek2_mla-tp_hf_base'
save_dir = os.path.join(self.test_config['test_deepseek2_mcore2hf_tp1pp4ep8'][0]['save-dir'], 'mg2hf')
assert weight_compare(base_dir, save_dir, suffix="safetensors", use_md5=True)
shutil.rmtree(save_dir)