#!/usr/bin/env bash
# REQUIRE: benchmark_leveldb.sh exists in the tools directory (this script invokes ./tools/benchmark_leveldb.sh).
# After execution of this script, log files are generated in $output_dir.
# report.txt provides high-level statistics.
#
# This should be used with the LevelDB fork listed below, which supports
# additional test options. For more details on the changes see the blog post,
# also listed below.
# https://github.com/mdcallag/leveldb-1
# http://smalldatum.blogspot.com/2015/04/comparing-leveldb-and-rocksdb-take-2.html
#
# This should be run from the parent of the tools directory. The command line is:
# [$env_vars] tools/run_flash_bench.sh [list-of-threads]
#
# This runs tests in the following sequence:
# step 1) load - fillseq (twice), overwrite
# step 2) read-only for each number of threads
# step 3) read-write for each number of threads
#
# The list of threads is optional and defaults to "24" when not set.
# If list-of-threads is specified as "1 2 4" then the tests in steps 2 and 3
# above are repeated for 1, 2 and 4 threads. The tests in step 1 are
# only run for 1 thread.
# Test output is written to $OUTPUT_DIR, by default /tmp/output. The performance
# summary is in $OUTPUT_DIR/report.txt. There is one file in $OUTPUT_DIR per
# test and the tests are listed below.
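#
# A hypothetical example invocation (the NKEYS value and DATA_DIR path are
# illustrative, not defaults): run the load step once, then the read-only and
# read-write steps for 1, 8 and 16 threads:
#   NKEYS=$((100 * 1024 * 1024)) DATA_DIR=/data/leveldb tools/run_flash_bench.sh 1 8 16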
#
# The environment variables are also optional. The variables are:
# NKEYS - number of key/value pairs to load
# NWRITESPERSEC - the writes/second rate limit for the *whilewriting* tests.
# If this is too large then the non-writer threads can get
# starved.
# VAL_SIZE - the length of the value in each key/value pair loaded.
# You can estimate the size of the test database from this,
# NKEYS and the compression rate (--compression_ratio) set
# in tools/benchmark_leveldb.sh; see the sizing example
# after this list.
# BLOCK_LENGTH - value for db_bench --block_size
# CACHE_BYTES - the size of the LevelDB block cache in bytes
# DATA_DIR - directory in which to create database files
# DO_SETUP - when set to 0, a backup of the database is copied from
# $DATA_DIR.bak to $DATA_DIR and the load tests from step 1 are skipped.
# This allows tests from steps 2 and 3 to be repeated faster.
# SAVE_SETUP - saves a copy of the database at the end of step 1 to
# $DATA_DIR.bak.
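#
# As a rough sizing example: the defaults below (NKEYS=2^30, VAL_SIZE=400)
# load ~400GiB of raw value data (2^30 keys * 400 bytes). If
# --compression_ratio in tools/benchmark_leveldb.sh were 0.5 (an assumed
# value; check that script), expect roughly half of that on disk.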
# Size constants
K=1024
M=$((1024 * K))
G=$((1024 * M))
num_keys=${NKEYS:-$((1 * G))}
wps=${NWRITESPERSEC:-$((10 * K))}
vs=${VAL_SIZE:-400}
cs=${CACHE_BYTES:-$(( 1 * G ))}
bs=${BLOCK_LENGTH:-4096}
# If no command line arguments then run for 24 threads.
if [[ $# -eq 0 ]]; then
  nthreads=( 24 )
else
  nthreads=( "$@" )
fi
for num_thr in "${nthreads[@]}" ; do
  echo Will run for $num_thr threads
done
# Update these parameters before execution!
# Note: no trailing slash on db_dir, so that ${db_dir}.bak names a sibling
# directory (a trailing slash would put the backup inside $db_dir, where the
# restore path would delete it).
db_dir=${DATA_DIR:-"/tmp/rocksdb"}
do_setup=${DO_SETUP:-1}
save_setup=${SAVE_SETUP:-0}
output_dir="${TMPDIR:-/tmp}/output"
ARGS="\
OUTPUT_DIR=$output_dir \
NUM_KEYS=$num_keys \
DB_DIR=$db_dir \
VALUE_SIZE=$vs \
BLOCK_SIZE=$bs \
CACHE_SIZE=$cs"
mkdir -p $output_dir
echo -e "ops/sec\tmb/sec\tusec/op\tavg\tp50\tTest" \
> $output_dir/report.txt
# Notes on test sequence:
# step 1) Setup database via sequential fill followed by overwrite to fragment it.
# Done without setting DURATION to make sure that overwrite does $num_keys writes
# step 2) read-only tests for all levels of concurrency requested
# step 3) non read-only tests for all levels of concurrency requested
###### Setup the database
if [[ $do_setup != 0 ]]; then
  echo Doing setup
  # Test 2a: sequential fill with large values to get peak ingest rate.
  # NUM_KEYS is scaled down so that the total bytes written stay roughly
  # the same as with the regular value size (num_keys/64 keys at 32KB each).
  env $ARGS BLOCK_SIZE=$((1 * M)) VALUE_SIZE=$((32 * K)) NUM_KEYS=$(( num_keys / 64 )) \
    ./tools/benchmark_leveldb.sh fillseq
  # Test 2b: sequential fill with the configured value size
  env $ARGS ./tools/benchmark_leveldb.sh fillseq
  # Test 3: single-threaded overwrite with sync disabled (DB_BENCH_NO_SYNC=1)
  env $ARGS NUM_THREADS=1 DB_BENCH_NO_SYNC=1 ./tools/benchmark_leveldb.sh overwrite
else
  echo Restoring from backup
  rm -rf $db_dir
  if [ ! -d ${db_dir}.bak ]; then
    echo Database backup does not exist at ${db_dir}.bak
    exit 1
  fi
  echo Restore database from ${db_dir}.bak
  cp -p -r ${db_dir}.bak $db_dir
fi
if [[ $save_setup != 0 ]]; then
  echo Save database to ${db_dir}.bak
  cp -p -r $db_dir ${db_dir}.bak
fi
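# A typical two-phase workflow (the thread count is illustrative): save the
# loaded database once, then restore it on later runs to repeat the read
# tests without reloading:
#   SAVE_SETUP=1 tools/run_flash_bench.sh 8   # load, then save to $DATA_DIR.bak
#   DO_SETUP=0 tools/run_flash_bench.sh 8     # restore backup, skip the load step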
###### Read-only tests
for num_thr in "${nthreads[@]}" ; do
  # Test 4: random read
  env $ARGS NUM_THREADS=$num_thr ./tools/benchmark_leveldb.sh readrandom
done
###### Non read-only tests
for num_thr in "${nthreads[@]}" ; do
  # Test 7: overwrite with sync=0
  env $ARGS NUM_THREADS=$num_thr DB_BENCH_NO_SYNC=1 \
    ./tools/benchmark_leveldb.sh overwrite
  # Test 8: overwrite with sync=1
  # Not run for now because LevelDB db_bench doesn't have an option to limit the
  # test run to X seconds and doing sync-per-commit for --num can take too long.
  # env $ARGS NUM_THREADS=$num_thr ./tools/benchmark_leveldb.sh overwrite
  # Test 11: random read while writing
  env $ARGS NUM_THREADS=$num_thr WRITES_PER_SECOND=$wps \
    ./tools/benchmark_leveldb.sh readwhilewriting
done
echo bulkload > $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep bulkload $output_dir/report.txt >> $output_dir/report2.txt
echo fillseq >> $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep fillseq $output_dir/report.txt >> $output_dir/report2.txt
echo overwrite sync=0 >> $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep overwrite $output_dir/report.txt | grep '\.s0' >> $output_dir/report2.txt
echo overwrite sync=1 >> $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep overwrite $output_dir/report.txt | grep '\.s1' >> $output_dir/report2.txt
echo readrandom >> $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep readrandom $output_dir/report.txt >> $output_dir/report2.txt
echo readwhile >> $output_dir/report2.txt
head -1 $output_dir/report.txt >> $output_dir/report2.txt
grep readwhilewriting $output_dir/report.txt >> $output_dir/report2.txt
cat $output_dir/report2.txt