#!/bin/bash
source /usr/local/Ascend/cann/set_env.sh
NPUS_PER_NODE=8
MASTER_ADDR=localhost
MASTER_PORT=19002
NNODES=1
NODE_RANK=0
WORLD_SIZE=$(($NPUS_PER_NODE*$NNODES))
LOAD_PATH="ckpt/flux"
OUTPUT_DIR="data/rl_embeddings"
PROMPT_DIR="data/prompts.txt"
DISTRIBUTED_ARGS="
--nproc_per_node $NPUS_PER_NODE \
--nnodes $NNODES \
--node_rank $NODE_RANK \
--master_addr $MASTER_ADDR \
--master_port $MASTER_PORT
"
GRPO_ARGS="
--load $LOAD_PATH \
--output_dir $OUTPUT_DIR \
--prompt_dir $PROMPT_DIR \
--sample_num 50000 \
"
logfile=$(date +%Y%m%d)_$(date +%H%M%S)
mkdir -p logs
torchrun $DISTRIBUTED_ARGS mindspeed_mm/tasks/rl/soragrpo/preprocess/flux_data_preprocess.py \
$GRPO_ARGS \
2>&1 | tee logs/preprocess_${logfile}.log