#! /bin/bash
# Prepares the newstest2014 de-en data: downloads and unpacks the two SGM
# files, clones a tool repository into ./mosesdecoder, and runs its
# input-from-sgm.perl over both files to produce ./data/newstest2014.de and
# ./data/newstest2014.en.
#
# Must be run from the directory that contains url.ini, which supplies:
#   data_url=<URL of the dev.tgz archive>
#   git_url=<URL of the repository cloned into ./mosesdecoder>

# Abort on the first failing command.
set -e

# Run every tool started below under a UTF-8 locale.
export LANG=C.UTF-8
export LC_ALL=C.UTF-8

# Read each setting by stripping only its own "key=" prefix. A greedy
# 's/.*=//' would cut everything up to the LAST "=", truncating values that
# contain "=" themselves (e.g. URLs with a query string).
data_url=$(sed -n 's/^data_url=//p' url.ini)
git_url=$(sed -n 's/^git_url=//p' url.ini)
# Download and unpack the two newstest2014 SGM files unless both are already
# present. Testing for the extracted files (rather than for the directory,
# which is created before the download starts) means a run that failed during
# download or extraction is repaired simply by running the script again.
dev_archive=./data/dev/dev.tgz
dev_members=(
  dev/newstest2014-deen-src.de.sgm
  dev/newstest2014-deen-ref.en.sgm
)
if [[ ! -f ./data/${dev_members[0]} || ! -f ./data/${dev_members[1]} ]]; then
  mkdir -p ./data/dev
  # An archive left by an earlier run is reused instead of re-downloaded.
  if [[ ! -f $dev_archive ]]; then
    # Fetch under a temporary name and rename only on success, so a partial
    # download is never mistaken for a complete archive. The URL is quoted to
    # prevent word splitting and globbing (URLs may contain "?" or "*"), and
    # an empty value aborts with a clear message.
    wget -O "$dev_archive.part" "${data_url:?data_url is missing from url.ini}"
    mv -- "$dev_archive.part" "$dev_archive"
  fi
  # Extract only the two members that the rest of the script reads.
  tar -xvzf "$dev_archive" -C ./data/ "${dev_members[@]}"
fi
# Clone the tool repository and pin it to a fixed commit, unless
# ./mosesdecoder already exists (an existing checkout is left untouched).
moses_dir=./mosesdecoder
moses_rev=8c5eaa1a122236bbf927bde4ec610906fea599e6
if [[ ! -d $moses_dir ]]; then
  # Work in a staging directory and rename it only after the pin succeeded;
  # otherwise a failed or interrupted run would leave ./mosesdecoder at the
  # wrong revision and every later run would skip this step.
  moses_stage=$moses_dir.partial
  rm -rf -- "$moses_stage"
  # Quoted so the URL is passed as a single argument; an empty value aborts
  # with a clear message.
  git clone "${git_url:?git_url is missing from url.ini}" "$moses_stage"
  # "git -C" runs the reset inside the clone without changing this script's
  # own working directory.
  git -C "$moses_stage" reset --hard "$moses_rev"
  mv -- "$moses_stage" "$moses_dir"
fi
# Feed each downloaded SGM file through input-from-sgm.perl and store the
# output as ./data/newstest2014.<language>: the "src.de" file yields
# newstest2014.de and the "ref.en" file yields newstest2014.en.
sgm_converter=./mosesdecoder/scripts/ems/support/input-from-sgm.perl
for sgm_part in src.de ref.en; do
  # The text after the dot ("de" / "en") is the output file's extension.
  out_ext=${sgm_part#*.}
  "$sgm_converter" \
    < "./data/dev/newstest2014-deen-${sgm_part}.sgm" \
    > "./data/newstest2014.${out_ext}"
done