{
"test_deepseek2_hf2mcore_tp1pp4ep8": [
{
"param": {
"load-model-type":"hf",
"save-model-type":"mg",
"target-tensor-parallel-size": "1",
"target-pipeline-parallel-size": "4",
"target-expert-parallel-size": "8",
"load-dir":"/data/ci/models/deepseek-v2/hf/deepseek2_hf",
"save-dir":"/data/ci/cache/deepseek2_tp1pp4ep8",
"moe-grouped-gemm": null,
"model-type-hf": "deepseek2"
}
}
],
"test_deepseek2_mcore2hf_tp1pp4ep8": [
{
"param": {
"load-model-type":"mg",
"save-model-type": "hf",
"target-tensor-parallel-size": "1",
"target-pipeline-parallel-size": "1",
"target-expert-parallel-size": "1",
"save-dir":"/data/ci/cache/deepseek2_mcore2hf_tp1pp4ep8",
"load-dir":"/data/ci/models/deepseek2/mg/deepseek2-l8-t1p4e8-gemm_new",
"moe-grouped-gemm": null,
"model-type-hf": "deepseek2"
}
},
{
"Base_MD5" : [
"1ef5746a963567807c4ae8cbe3a41a6d",
"60954e6785413957795d97225e7f68e0",
"f745e721139f6983a2e670075a54f21f",
"18913d7ddd32a11115c5496a9fee477b",
"d96f48ce36f61ed873bc0cef6ebfc477",
"53cdecbfac8b8344843c44836f3f5508",
"79c0148764502c74fb9e57edb698651e",
"52c2778b5fd83d47fa97985befa4991b"
]
}
],
"test_deepseek3_hf2mcore_tp2pp2vpp1ep2nooplayer": [
{
"param": {
"load-model-type":"hf",
"save-model-type":"mg",
"target-tensor-parallel-size": "2",
"target-pipeline-parallel-size": "2",
"target-expert-parallel-size": "2",
"noop-layers": "0,3",
"load-dir":"/data/ci/models/deepseek3/hf/deepseek3-hf-L2-mtp",
"save-dir":"/data/ci/cache/deepseek3-mtp-L2-tp2pp2ep2vpp1-noop-vpp",
"moe-grouped-gemm": null,
"model-type-hf": "deepseek3",
"num-layers": "2",
"mtp-num-layers": "1",
"first-k-dense-replace": "1",
"num-layers-per-virtual-pipeline-stage": "1"
}
},
{
"Base_MD5" : [
"8805ec24708437fe",
"9f0d52ea91a872ab",
"76fd1c0e20dd533e",
"c356bd6afc0c2b05",
"102f50e55644ece9",
"bc1e75fd4f52e815",
"4ed30b99759f9414",
"0768638e4c6bd700"
]
}
]
}