blob: a2b84d6d32e79b16031023da92a44902feb39939 [file] [log] [blame]
#!/bin/bash
# This script tests GHKM grammar extraction with the Joshua pipeline, training on a 1000-sentence
# Urdu-English parallel corpus. The pipeline is run with --last-step GRAMMAR and no tuning or test
# sets are passed; the test succeeds if a non-empty grammar file is produced. It uses the Berkeley
# aligner for alignment to avoid the dependency on compiling GIZA.
# Run directory handed to the pipeline, and the grammar file this test
# looks for inside it once the pipeline has finished.
rundir=2
grammar="$rundir/grammar.gz"

# Start from a clean slate so a grammar left over from an earlier run
# cannot make this test pass.
rm -rf -- "$rundir"

# Fail early with a readable message when JOSHUA is not set; otherwise the
# command below would try to run /scripts/training/pipeline.pl and the only
# hint would be buried in the log file.
if [[ -z "${JOSHUA:-}" ]]; then
  echo "error: JOSHUA must be set to the Joshua installation directory" >&2
  exit 1
fi

# Run the pipeline with GHKM extraction, stopping after the GRAMMAR step.
# All pipeline output (stdout and stderr) goes to pipeline-ghkm.log.
# The pipeline's own exit status is intentionally not consulted: success is
# judged only by the grammar file check below.
"$JOSHUA/scripts/training/pipeline.pl" \
  --readme "testing GHKM extraction" \
  --rundir "$rundir" \
  --type ghkm \
  --source ur \
  --target en \
  --corpus input/train \
  --last-step GRAMMAR \
  --aligner-mem 4g \
  --aligner berkeley > pipeline-ghkm.log 2>&1

# NOTE(review): the disabled check below refers to run directory 1, which this
# script never creates -- presumably copied from another test; confirm before
# re-enabling.
#diff -u 1/test/final-bleu final-bleu.gold

# Pass (exit 0) only if the grammar file exists and has a non-zero size;
# a missing or empty file fails the test (exit 1).
if [[ -s "$grammar" ]]; then
  exit 0
else
  exit 1
fi