#!/bin/bash
# Runs dlrm.scripts.main on synthetic data across a matrix of option values.
#
# For every feature spec matched under feature_specs/, a synthetic dataset is
# generated below /tmp/generated_data/, then dlrm.scripts.main is invoked twice
# per option combination: once directly (with --mode train) and once through
# torch.distributed.launch with --nproc_per_node 8. The combinations cover
# --optimized_mlp, --cuda_graphs, --interaction_op and --amp as listed in the
# loops below. The generated dataset is removed once its matrix has finished.
#
# Usage: <script> [NAMES] [OPTIONS]
#   NAMES    file name or glob relative to feature_specs/ (default: '*.yaml')
#   OPTIONS  accepted for compatibility; not referenced by this script
#
# The feature_specs/ path is relative, so run this from the directory that
# contains it. Any failing command aborts the script (set -e); in that case the
# dataset generated for the current spec is left in place.
set -e
set -x

NAMES=${1:-'*.yaml'}
TARGET=feature_specs/${NAMES}
# shellcheck disable=SC2034  # intentionally unused, see header
OPTIONS=${2-""}

# Expand the pattern exactly once into an array. nullglob turns an unmatched
# glob into an empty list instead of leaving the literal pattern to be passed
# to python as though it were a file name.
shopt -s nullglob
# shellcheck disable=SC2206  # unquoted on purpose: TARGET is a glob pattern
spec_files=( ${TARGET} )
shopt -u nullglob

if (( ${#spec_files[@]} == 0 )); then
  printf 'error: no feature spec matches %s\n' "${TARGET}" >&2
  exit 1
fi

# List the specs that are about to be processed.
printf '%s\n' "${spec_files[@]}"

for fspec_file in "${spec_files[@]}"; do
  SYNTH_DATA_DIR=/tmp/generated_data/${fspec_file}
  # Shell-escaped copy of the path, for embedding in the `bash -c` string below.
  printf -v synth_dir_quoted '%q' "${SYNTH_DATA_DIR}"

  # Generate the synthetic dataset described by this feature spec.
  python -m dlrm.scripts.prepare_synthetic_dataset \
    --feature_spec "${fspec_file}" \
    --synthetic_dataset_dir "${SYNTH_DATA_DIR}"

  for mlp in True False; do
    for graphs in True; do
      for dot in cuda_dot dot; do
        for amp in True False; do
          # Direct, single-launch run.
          python -m dlrm.scripts.main --mode train --dataset "${SYNTH_DATA_DIR}" \
            --optimized_mlp="${mlp}" --cuda_graphs="${graphs}" \
            --interaction_op="${dot}" --embedding_type=joint_sparse --amp="${amp}"
          # Run through the distributed launcher; each process is wrapped by bind.sh.
          python -m torch.distributed.launch --no_python --use_env --nproc_per_node 8 \
            bash -c "/workspace/dlrm/bind.sh --cpu=exclusive -- python -m dlrm.scripts.main --dataset ${synth_dir_quoted} --optimized_mlp=${mlp} --cuda_graphs=${graphs} --interaction_op=${dot} --embedding_type=joint_sparse --amp=${amp}"
        done
      done
    done
  done

  # `:?` aborts rather than expanding to nothing; `--` stops option parsing.
  rm -r -- "${SYNTH_DATA_DIR:?}"
done