# Model selection and runtime switches.
# NOTE(review): the nesting here is reconstructed. With every key at column 0,
# `model_config` and `custom_params` parse as null and their settings become
# unrelated top-level keys.
model_config:
  model_name: "deepseek_r1"
  # Location of the model weights on disk. The directory name suggests a W8A8
  # quantized checkpoint -- TODO confirm.
  model_path: "/data/models/origin/DeepSeek-R1-W8A8"
  with_ckpt: true
  exe_mode: "npugraph_ex"
  enable_static_kernel: false
  enable_profiler: false
  force_eplb: false
  enable_cache_compile: false
  # NOTE(review): assumed to be a child of model_config (it is the only section
  # header without the `_config` suffix) -- confirm against the config loader
  # and dedent to the top level if the loader reads it from there.
  custom_params:
    enable_mla_prolog: true
    enable_multi_streams: true
    enable_superkernel: false
    moe_chunk_max_len: 65536
    micro_batch_mode: 0
# Input dataset settings.
# NOTE(review): children are indented so that `data_config` is a mapping; with
# every key at column 0 it parses as null.
data_config:
  dataset: "LongBench"
  # Same value as max_prefill_tokens (256); presumably the two are meant to be
  # kept in sync -- TODO confirm.
  input_truncated_len: 256
# Parallelism layout.
# NOTE(review): children are indented so that `parallel_config` is a mapping;
# with every key at column 0 it parses as null.
parallel_config:
  world_size: 16
  # Every *_tp_size below is set to the same value as world_size (16).
  attn_tp_size: 16
  dense_tp_size: 16
  moe_tp_size: 16
  embed_tp_size: 16
  lmhead_tp_size: 16
# Scheduling and generation limits.
# NOTE(review): children are indented so that `scheduler_config` is a mapping;
# with every key at column 0 it parses as null.
scheduler_config:
  block_size: 128
  max_new_tokens: 100
  # Same value as input_truncated_len (256); presumably the two are meant to be
  # kept in sync -- TODO confirm.
  max_prefill_tokens: 256
  batch_size: 1