Update benchmarks used to measure subcompaction performance

Summary: After working closely with Mark, Siying, and Yueh-Hsuan, this set of changes reflects the updates needed to measure RocksDB subcompaction performance correctly. The essence of the benchmark is executing `fillrandom` followed by `compact`, with the correct set of options, once for each specified number of subcompactions. Test Plan: Tested internally to verify correctness and reliability. Reviewers: sdong, yhchiang, MarkCallaghan Reviewed By: MarkCallaghan Subscribers: dhruba Differential Revision: https://reviews.facebook.net/D55089
2016-03-04 12:32:11 -08:00 · 2016-03-04 12:32:11 -08:00 · 68189f7e1b
commit 68189f7e1b
parent dfe96c72c3
2 changed files with 82 additions and 24 deletions
--- a/tools/benchmark.sh
+++ b/tools/benchmark.sh
@ -8,6 +8,14 @@ if [ $# -ne 1 ]; then
  exit 0
 fi
 # Make it easier to run only the compaction test. Getting valid data requires
 # a number of iterations, so being able to run this test separately from the
 # rest of the benchmarks helps.
 if [ "$COMPACTION_TEST" == "1" -a "$1" != "universal_compaction" ]; then
  echo "Skipping $1 because it's not a compaction test."
  exit 0
 fi
 # size constants
 K=1024
 M=$((1024 * K))
@ -104,6 +112,23 @@ params_bulkload="$const_params --max_background_compactions=16 --max_background_
                 --level0_slowdown_writes_trigger=$((10 * M)) \
                 --level0_stop_writes_trigger=$((10 * M))"
 #
 # Tune values for level and universal compaction.
 # For universal compaction, these level0_* options mean the total number of
 # sorted runs in the LSM. In level-based compaction, they mean the number of
 # L0 files.
 #
 params_level_compact="$const_params --max_background_compactions=16 \
                --max_background_flushes=7 \
                --level0_file_num_compaction_trigger=4 \
                --level0_slowdown_writes_trigger=16 \
                --level0_stop_writes_trigger=20"
 params_univ_compact="$const_params --max_background_compactions=16 \
                --max_background_flushes=7 \
                --level0_file_num_compaction_trigger=8 \
                --level0_slowdown_writes_trigger=16 \
                --level0_stop_writes_trigger=20"
 function summarize_result {
  test_out=$1
  test_name=$2
@ -162,29 +187,64 @@ function run_bulkload {
  eval $cmd
 }
-function run_univ_compaction_worker {
+function run_manual_compaction_worker {
-  # Worker function intended to be called from run_univ_compaction.
+  # This runs with a vector memtable and the WAL disabled to load faster.
-  echo -e "\nCompacting ...\n"
+  # It is still crash safe and the client can discover where to restart a
  # load after a crash. I think this is a good way to load.
  echo "Bulk loading $num_keys random keys for manual compaction."
-  compact_output_file=$output_dir/benchmark_univ_compact_sub_$3.t${num_threads}.s${syncval}.log
+  fillrandom_output_file=$output_dir/benchmark_man_compact_fillrandom_$3.log
  man_compact_output_log=$output_dir/benchmark_man_compact_$3.log
-  # The essence of the command is borrowed from run_change overwrite with
+  if [ "$2" == "1" ]; then
-  # compaction specific options being added.
+    extra_params=$params_univ_compact
-  cmd="./db_bench --benchmarks=overwrite \
+  else
-       --use_existing_db=1 \
+    extra_params=$params_level_compact
-       --sync=$syncval \
+  fi
-       $params_w \
+
  # Make sure that fillrandom uses the same compaction options as compact.
  cmd="./db_bench --benchmarks=fillrandom \
       --use_existing_db=0 \
       --disable_auto_compactions=0 \
       --sync=0 \
       $extra_params \
       --threads=$num_threads \
       --merge_operator=\"put\" \
       --seed=$( date +%s ) \
       --compaction_measure_io_stats=$1 \
       --compaction_style=$2 \
       --subcompactions=$3 \
-       2>&1 | tee -a $compact_output_file"
+       --memtablerep=vector \
-  echo $cmd | tee $compact_output_file
+       --disable_wal=1 \
       --seed=$( date +%s ) \
       2>&1 | tee -a $fillrandom_output_file"
  echo $cmd | tee $fillrandom_output_file
  eval $cmd
-  summarize_result $compact_output_file univ_compact_sub_comp_$3 overwrite
+  summarize_result $fillrandom_output_file man_compact_fillrandom_$3 fillrandom
  echo "Compacting with $3 subcompactions specified ..."
  # This is the part we're really interested in. Since the compact benchmark
  # doesn't output regular statistics, we just use the time command to
  # measure how long this step takes.
  cmd="{ \
       time ./db_bench --benchmarks=compact \
       --use_existing_db=1 \
       --disable_auto_compactions=0 \
       --sync=0 \
       $extra_params \
       --threads=$num_threads \
       --compaction_measure_io_stats=$1 \
       --compaction_style=$2 \
       --subcompactions=$3 \
       ;}
       2>&1 | tee -a $man_compact_output_log"
  echo $cmd | tee $man_compact_output_log
  eval $cmd
  # Can't use summarize_result here. One way to analyze the results is to run
  # "grep real" on the resulting log files.
 }
 function run_univ_compaction {
@ -198,14 +258,16 @@ function run_univ_compaction {
  # by allowing the usage of { 1, 2, 4, 8, 16 } threads for different runs.
  subcompactions=("1" "2" "4" "8" "16")
-  # Have a separate suffix for each experiment so that separate results will be
+  # Do the real work of running various experiments.
-  # persisted.
+
  # Run the compaction benchmark, which is based on bulkload. It pretty much
  # consists of running manual compaction with different numbers of
  # subcompaction threads.
  log_suffix=1
  # Do the real work of running various experiments.
  for ((i=0; i < ${#subcompactions[@]}; i++))
  do
-    run_univ_compaction_worker $io_stats $compaction_style ${subcompactions[$i]} $log_suffix
+    run_manual_compaction_worker $io_stats $compaction_style ${subcompactions[$i]} $log_suffix
    ((log_suffix++))
  done
 }
--- a/tools/run_flash_bench.sh
+++ b/tools/run_flash_bench.sh
@ -267,7 +267,7 @@ done
 ###### Universal compaction tests.
 # Use a single thread to reduce the variability in the benchmark.
-env $ARGS NUM_THREADS=1 ./tools/benchmark.sh universal_compaction
+env $ARGS COMPACTION_TEST=1 NUM_THREADS=1 ./tools/benchmark.sh universal_compaction
 if [[ $skip_low_pri_tests != 1 ]]; then
  echo bulkload > $output_dir/report2.txt
@ -355,8 +355,4 @@ if [[ $skip_low_pri_tests != 1 ]]; then
  grep revrangewhilemerg $output_dir/report.txt >> $output_dir/report2.txt
 fi
 echo universal_compaction >> $output_dir/report2.txt
 head -1 $output_dir/report.txt >> $output_dir/report2.txt
 grep univ_compact $output_dir/report.txt >> $output_dir/report2.txt
 cat $output_dir/report2.txt