#!/bin/bash
#
# Builds the performance dataset and serves it with gpfdist.
#
# Usage: <this script> NUM_COPIES GPFDIST_PORT
#   $1 NUM_COPIES    how many times dataset/perfdata.csv is concatenated into
#                    the generated perfdata.csv (non-negative integer)
#   $2 GPFDIST_PORT  port passed to `gpfdist -p` (1-65535)
#
# Environment:
#   MASTER_DATA_DIRECTORY  must be set and non-empty; the dataset is written
#                          to $MASTER_DATA_DIRECTORY/perfdataset
#   HOSTNAME               substituted into the generated sql/ans files
#
# The paths dataset/, sql/ and expected/ are relative, so the script has to be
# run from the directory that contains them.
#
# Side effects: deletes and recreates the perfdataset directory, kills all
# running gpfdist processes, starts a new gpfdist in the background, and
# regenerates ./sql/setup.sql and ./expected/setup.out from their templates.

set -euo pipefail

# Print a message to stderr and abort.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Validate everything before touching the filesystem.
(( $# >= 2 )) || die "Usage: ${0##*/} NUM_COPIES GPFDIST_PORT"
[[ "$1" =~ ^[0-9]+$ ]] || die "NUM_COPIES must be a non-negative integer, got '$1'"
[[ "$2" =~ ^[0-9]+$ ]] && (( 10#$2 >= 1 && 10#$2 <= 65535 )) \
  || die "GPFDIST_PORT must be an integer in 1-65535, got '$2'"

# 10# forces base 10 so a value such as "010" is not read as octal.
num_copies=$(( 10#$1 ))
gpfdist_port=$2

# ':?' aborts when the variable is unset or empty, so the rm -rf below can
# never be pointed at "/perfdataset".
dataset_dir="${MASTER_DATA_DIRECTORY:?MASTER_DATA_DIRECTORY must be set}/perfdataset"
source_csv=dataset/perfdata.csv

[[ -r "$source_csv" ]] || die "cannot read $source_csv (run from the test directory)"

# Create dataset directory that gpfdist will host
rm -rf -- "$dataset_dir"
mkdir -- "$dataset_dir"

# Generate dataset
# TODO: this is very slow to generate big datasets (e.g. 500 million
# rows)... need to replace with something much faster
for (( i = 0; i < num_copies; i++ )); do
  cat -- "$source_csv" >> "$dataset_dir/perfdata.csv"
done

# Kill gpfdist processes and host the dataset.
# killall exits non-zero when no gpfdist is running; that is not an error here.
killall gpfdist || true
# Pause before restarting -- presumably to let the old processes exit and
# release the port (TODO confirm the required delay).
sleep 5
gpfdist -p "$gpfdist_port" -d "$dataset_dir" -l "$dataset_dir/gpfdist.log" &

# Update sql and ans file with hostname and gpfdist port
sed "s/@hostname@:@gpfdist_port@/${HOSTNAME}:${gpfdist_port}/" \
  ./sql/setup.sql.template > ./sql/setup.sql
sed "s/@hostname@:@gpfdist_port@/${HOSTNAME}:${gpfdist_port}/" \
  ./expected/setup.out.template > ./expected/setup.out