import os
import unittest
from mskpp import Tensor, Chip, vmaddrelu, vmla
from mskpp._C import task_schedule
from test.utils.test_base import TestBase
UB_MEM = "UB"
GM_MEM = "GM"
FP_16_TYPE = "FP16"
FP_32_TYPE = "FP32"
FORMAT_TYPE = "ND"
def my_vmaddrelu(gm_x, gm_y, gm_z):
x = Tensor(UB_MEM)
y = Tensor(UB_MEM)
z = Tensor(UB_MEM)
x.load(gm_x)
y.load(gm_y)
out = vmaddrelu(x, y, z)()
gm_z.load(out[0])
def my_vmla(gm_x, gm_y, gm_z, if_mix=False):
x = Tensor(UB_MEM)
y = Tensor(UB_MEM)
z = Tensor(UB_MEM)
x.load(gm_x)
y.load(gm_y)
out = vmla(x, y, z, if_mix)()
gm_z.load(out[0])
class TestUtilsMethods(TestBase):
TRACE_FILE = 'trace.json'
def clean(self):
task_schedule.Schedule().clean()
work_dir = os.getcwd()
self.batch_delete_folders(work_dir, 'MSKPP_*')
def test_vmaddrelu_fp32_expect_trace_successful_create(self):
with Chip("Ascend910B1") as chip:
chip.enable_trace()
in_x_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_y_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_z_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_x_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
in_y_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
in_z_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
my_vmaddrelu(in_x_fp16, in_y_fp16, in_z_fp16)
my_vmaddrelu(in_x_fp32, in_y_fp32, in_z_fp32)
trace_file = os.path.join(chip.output_dir, self.TRACE_FILE)
self.assertTrue(os.path.exists(trace_file))
self.clean()
def test_vmla_expect_trace_successful_create(self):
with Chip("Ascend910B1") as chip:
chip.enable_trace()
in_x_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_y_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_x_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
in_y_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
in_z_fp16 = Tensor(GM_MEM, FP_16_TYPE, [64, 128], format=FORMAT_TYPE)
in_z_fp32 = Tensor(GM_MEM, FP_32_TYPE, [64, 128], format=FORMAT_TYPE)
my_vmla(in_x_fp32, in_y_fp32, in_z_fp32)
my_vmla(in_x_fp16, in_y_fp16, in_z_fp16)
my_vmla(in_x_fp16, in_y_fp16, in_z_fp32, True)
trace_file = os.path.join(chip.output_dir, self.TRACE_FILE)
self.assertTrue(os.path.exists(trace_file))
self.clean()
if __name__ == '__main__':
unittest.main()