# test/pipeline/test-ghkm.sh - joshua - Git at Google

 #!/bin/bash

 # Smoke test for GHKM grammar extraction with the Joshua pipeline.
 #
 # Trains on the parallel corpus at input/train (source "ur", target "en";
 # described upstream as a 1000-sentence Urdu-English corpus) and stops after
 # the GRAMMAR step (--last-step GRAMMAR), so no tuning or test sets are passed.
 # The Berkeley aligner is used for alignment to avoid the dependency on
 # compiling GIZA.
 #
 # Requires: JOSHUA must point at the directory containing
 #           scripts/training/pipeline.pl.
 # Outputs:  pipeline stdout and stderr are written to pipeline-ghkm.log;
 #           the run directory is ./2 and is recreated on every run.
 # Exit:     0 if 2/grammar.gz exists and is non-empty, 1 otherwise.

 # Without this guard an unset JOSHUA would expand to
 # "/scripts/training/pipeline.pl" and fail with a confusing error.
 if [[ -z "${JOSHUA:-}" ]]; then
   echo "test-ghkm.sh: JOSHUA must be set" >&2
   exit 1
 fi

 readonly rundir=2
 readonly grammar="${rundir}/grammar.gz"

 # Remove any earlier run so leftovers cannot satisfy the check at the end.
 rm -rf -- "${rundir}"

 "${JOSHUA}/scripts/training/pipeline.pl" \
   --readme "testing GHKM extraction" \
   --rundir "${rundir}" \
   --type ghkm \
   --source ur \
   --target en \
   --corpus input/train \
   --last-step GRAMMAR \
   --aligner-mem 4g \
   --aligner berkeley > pipeline-ghkm.log 2>&1
 pipeline_status=$?

 # The verdict below depends only on the grammar file, but a failing pipeline
 # is worth surfacing so the log gets looked at.
 if (( pipeline_status != 0 )); then
   echo "test-ghkm.sh: pipeline.pl exited with status ${pipeline_status}; see pipeline-ghkm.log" >&2
 fi

 # Disabled comparison kept as found (it refers to run directory 1, not 2):
 #diff -u 1/test/final-bleu final-bleu.gold

 # -s is true only when the file exists and has a size greater than zero.
 # NOTE(review): gzip output for empty input is still a few bytes long, so
 # this does not prove the grammar actually contains rules.
 if [[ -s "${grammar}" ]]; then
   exit 0
 fi
 exit 1