#!/bin/sh
#
# Runs one train/test pass per corpus block listed in $passes.
#
# For each block id, the split-N.log files of every OTHER block are
# concatenated into ORIG/ham-set$SCORESET.log and ORIG/spam-set$SCORESET.log,
# hard-linked into the current directory as ham.log / spam.log, and then
# "make clean", "make" and ./runGA are run.  Afterwards the held-out block's
# own split logs (gzipped), the build/run transcript and the
# gen-set$SCORESET-*/scores and gen-set$SCORESET-*/test files are saved under
# tenpass_results/ with the block id as suffix.
#
# Must be run from the directory that holds the Makefile and runGA, with
# $NSBASE/split-N.log and $SPBASE/split-N.log present for every N in $passes.
# Failing steps print their own error and the run carries on with the next
# step; nothing here aborts the loop.

# change these!
NSBASE=ham-logs
SPBASE=spam-logs
SCORESET="0"

passes="1 2 3 4 5 6 7 8 9 10"

mkdir -p tenpass_results
mkdir -p ORIG

# $passes is deliberately unquoted: it is a whitespace-separated list.
for id in $passes; do
  echo "Training for corpus $id..."
  pwd
  date

  # Start every pass with an empty transcript so that the copy saved as
  # make.output.$id holds exactly this pass's build and run output.
  : > make.output

  ham_train="ORIG/ham-set$SCORESET.log"
  spam_train="ORIG/spam-set$SCORESET.log"
  : > "$ham_train"
  : > "$spam_train"

  # printf instead of "echo -n": the latter is not portable under /bin/sh.
  printf '%s' "(using corpora blocks: "
  for notid in $passes; do
    if [ "$notid" != "$id" ]; then
      printf '%s ' "$notid"
      cat "$NSBASE/split-$notid.log" >> "$ham_train"
      cat "$SPBASE/split-$notid.log" >> "$spam_train"
    fi
  done
  echo "for training)"

  # -f: the links do not exist yet on a first run.
  rm -f ham.log spam.log
  ln "$ham_train" ham.log
  ln "$spam_train" spam.log

  make clean >> make.output 2>&1
  make >> make.output 2>&1
  # -a: append, otherwise tee truncates the file and discards the make
  # output collected just above.
  bash -x ./runGA 2>&1 | tee -a make.output

  rm -f ham.log spam.log
  date

  echo "Saving test data for corpus $id..."
  cp make.output "tenpass_results/make.output.$id"

  # Remove any archive left by an earlier run first; gzip will not silently
  # overwrite an existing .gz file.
  cp "$NSBASE/split-$id.log" "tenpass_results/ham-test.log.$id"
  rm -f "tenpass_results/ham-test.log.$id.gz"
  gzip "tenpass_results/ham-test.log.$id"

  cp "$SPBASE/split-$id.log" "tenpass_results/spam-test.log.$id"
  rm -f "tenpass_results/spam-test.log.$id.gz"
  gzip "tenpass_results/spam-test.log.$id"

  # The glob is left unquoted on purpose.  NOTE(review): this assumes exactly
  # one gen-set$SCORESET-* directory exists; with several matches cp is given
  # multiple sources and a non-directory target, and fails.
  cp "gen-set$SCORESET-"*/scores "tenpass_results/scores.$id"
  cp "gen-set$SCORESET-"*/test "tenpass_results/test.$id"
done