#!/bin/bash
# This builds a Spanish-English Hiero model on Europarl and News Commentary
# (assuming you've downloaded them from
# http://statmt.org/wmt14/translation-task.html), tuning against WMT's
# newstest 2013 and testing against newstest 2014. It also includes an extra
# language model (LM), built separately on Gigaword using KenLM's lmplz tool,
# which is available at $JOSHUA/bin/lmplz.
# Load the user's shell startup file (presumably where $JOSHUA is exported --
# confirm for your environment). It is sourced ahead of `set -u`, so
# unset-variable references inside ~/.bashrc are not treated as errors.
# shellcheck source=/dev/null
. ~/.bashrc
set -u

# Fail early with a clear message if the Joshua install location is missing.
: "${JOSHUA:?JOSHUA must be set to the Joshua installation directory}"

# Run the Joshua pipeline as ONE command. Every line except the last must end
# with a backslash: without it the shell ends the command at that line and
# tries to execute the following "--option ..." lines as separate commands.
# --corpus is passed twice, once per training corpus prefix.
"$JOSHUA/bin/pipeline.pl" \
  --rundir 2 \
  --readme "Baseline Hiero model" \
  --type hiero \
  --source es \
  --target en \
  --corpus /path/to/europarl/europarl-v7.es-en \
  --corpus /path/to/europarl/news-commentary-v7.es-en \
  --tune /path/to/newstest/newstest2013 \
  --test /path/to/newstest/newstest2014 \
  --threads 8 \
  --tuner mert \
  --joshua-mem 20g \
  --packer-mem 16g \
  --lmfile /path/to/gigaword/lmfile \
  --optimizer-runs 5