// src/kudu/util/test_util.cc - kudu - Git at Google

 // Licensed to the Apache Software Foundation (ASF) under one
 // or more contributor license agreements.  See the NOTICE file
 // distributed with this work for additional information
 // regarding copyright ownership.  The ASF licenses this file
 // to you under the Apache License, Version 2.0 (the
 // "License"); you may not use this file except in compliance
 // with the License.  You may obtain a copy of the License at
 //
 //   http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing,
 // software distributed under the License is distributed on an
 // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 // KIND, either express or implied.  See the License for the
 // specific language governing permissions and limitations
 // under the License.

 #include "kudu/util/test_util.h"

 #include <limits.h>
 #include <unistd.h>

 #include <cerrno>
 #include <cstdlib>
 #include <limits>
 #include <map>
 #include <memory>
 #include <ostream>
 #include <string>
 #include <utility>
 #include <vector>

 #ifdef __APPLE__
 #include <fcntl.h>
 #include <sys/param.h> // for MAXPATHLEN
 #endif

 #include <gflags/gflags.h>
 #include <glog/logging.h>
 #include <gtest/gtest-spi.h>

 #include "kudu/gutil/strings/numbers.h"
 #include "kudu/gutil/strings/split.h"
 #include "kudu/gutil/strings/strcat.h"
 #include "kudu/gutil/strings/stringpiece.h"
 #include "kudu/gutil/strings/strip.h"
 #include "kudu/gutil/strings/substitute.h"
 #include "kudu/gutil/strings/util.h"
 #include "kudu/gutil/walltime.h"
 #include "kudu/util/env.h"
 #include "kudu/util/faststring.h"
 #include "kudu/util/flags.h"
 #include "kudu/util/oid_generator.h"
 #include "kudu/util/path_util.h"
 #include "kudu/util/scoped_cleanup.h"
 #include "kudu/util/slice.h"
 #include "kudu/util/spinlock_profiling.h"
 #include "kudu/util/status.h"
 #include "kudu/util/string_case.h"
 #include "kudu/util/subprocess.h"

 // Policy consulted by KuduTest's destructor when deciding whether to delete
 // the per-test data directory.
 DEFINE_string(test_leave_files, "on_failure",
               "Whether to leave test files around after the test run. "
               " Valid values are 'always', 'on_failure', or 'never'");

 // Seed consumed by SeedRandom(); the default of 0 makes SeedRandom() derive a
 // seed from the current time instead.
 DEFINE_int32(test_random_seed, 0, "Random seed to use for randomized tests");

 // Declaration only: the flag itself is defined in another translation unit.
 DECLARE_string(time_source);

 using std::string;
 using std::vector;
 using strings::Substitute;

 namespace kudu {

 // Placeholder path used by OverrideKrb5Environment() for the Kerberos
 // environment variables.
 const char* kInvalidPath = "/dev/invalid-path-for-kudu-tests";
 // Names of the environment variables read by AllowSlowTests() and
 // UseLargeKeys() respectively.
 static const char* const kSlowTestsEnvVar = "KUDU_ALLOW_SLOW_TESTS";
 static const char* const kLargeKeysEnvVar = "KUDU_USE_LARGE_KEYS_IN_TESTS";

 // Timestamp captured when this file's statics are initialized;
 // GetTestDataDirectory() embeds it in the per-test directory name.
 static const uint64_t kTestBeganAtMicros = Env::Default()->NowMicros();

 // Global which production code can check to see if it is running
 // in a GTest environment (assuming the test binary links in this module,
 // which is typically a good assumption).
 //
 // This can be checked using the 'IsGTest()' function from test_util_prod.cc.
 bool g_is_gtest = true;

 ///////////////////////////////////////////////////
 // KuduTest
 ///////////////////////////////////////////////////

 // Prepares the per-test environment: snapshots the gflags state, creates the
 // test data directory, and installs flag defaults suited to unit tests.
 KuduTest::KuduTest()
     : env_(Env::Default()),
       flag_saver_(new google::FlagSaver()),
       test_dir_(GetTestDataDirectory()) {
   std::map<const char*, const char*> test_defaults;

   // No test depends on surviving a power cut (or equivalent), so skipping
   // fsync() is safe and makes tests dramatically faster.
   test_defaults.emplace("never_fsync", "true");
   // Turn off redaction.
   test_defaults.emplace("redact", "none");
   // The local wall clock is good enough even when it is not synchronized by
   // NTP: all test components run on the same node, so there is only a single
   // time source.
   test_defaults.emplace("time_source", "system_unsync");

   const bool use_small_keys = !UseLargeKeys();
   if (use_small_keys) {
     // Shorter RSA keys make tests faster. With the strong/high TLS v1.2 cipher
     // suites in use, 768 bits is the minimum for TLS-related RSA keys (Java
     // security policies in tests are tweaked to accept such certificates).
     // TSK keys can go down to 512 bits, the minimum given that the SHA256
     // digest is used for token signing/verification.
     test_defaults.emplace("ipki_server_key_size", "768");
     test_defaults.emplace("ipki_ca_key_size", "768");
     test_defaults.emplace("tsk_num_rsa_bits", "512");
     // Some OS distros default to a security level above 0, under which the
     // lax key lengths above are rejected (level 2 or higher), so override it.
     test_defaults.emplace("openssl_security_level_override", "0");
   }

   // Errors are deliberately not checked: some of these defaults only apply to
   // certain tests. When a flag lives in a library the test binary is not
   // linked with, SetCommandLineOptionWithMode() reports an error because the
   // flag is unknown to the gflags runtime.
   for (const auto& flag : test_defaults) {
     google::SetCommandLineOptionWithMode(flag.first, flag.second,
                                          google::SET_FLAGS_DEFAULT);
   }

   // When TEST_TMPDIR is set, glog picks it as its default log directory. Point
   // it at the test-case-specific subdirectory instead.
   FLAGS_log_dir = GetTestDataDirectory();
 }

 // Restores the saved flags and then, depending on --test_leave_files and on
 // whether the test had a fatal failure, either keeps or deletes the test
 // directory.
 //
 // Cleanup lives in the destructor rather than in TearDown() so that the
 // child-class destructor runs first: anything it owns (a minicluster, etc.)
 // is shut down before the files underneath it are removed.
 KuduTest::~KuduTest() {
   // Restore the flags before anything else so that they cannot affect the
   // test directory cleanup below.
   flag_saver_.reset();

   const string& leave_policy = FLAGS_test_leave_files;
   if (leave_policy == "always") {
     LOG(INFO) << "-----------------------------------------------";
     LOG(INFO) << "--test_leave_files specified, leaving files in " << test_dir_;
     return;
   }
   if (leave_policy == "on_failure" && HasFatalFailure()) {
     LOG(INFO) << "-----------------------------------------------";
     LOG(INFO) << "Had fatal failures, leaving test files at " << test_dir_;
     return;
   }

   VLOG(1) << "Cleaning up temporary test files...";
   WARN_NOT_OK(env_->DeleteRecursively(test_dir_),
               "Couldn't remove test files");
 }

 void KuduTest::SetUp() {
   InitSpinLockContentionProfiling();
   OverrideKrb5Environment();
 }

 // Returns 'relative_path' joined onto this test's data directory.
 string KuduTest::GetTestPath(const string& relative_path) const {
   string full_path = JoinPathSegments(test_dir_, relative_path);
   return full_path;
 }

 // Points the Kerberos environment variables at kInvalidPath, overwriting any
 // existing values.
 void KuduTest::OverrideKrb5Environment() {
   // The target must be a path that definitely does not exist and could not be
   // created by accident.
   //
   // /dev/null is not a suitable target: krb5 leaks when it reads an empty file
   // as a ticket cache, whereas non-existent files do not trigger that. See
   // MIT krb5 bug #8509.
   //
   // NOTE: simply *unsetting* the variables is not enough either, because then
   // the user's /etc/krb5.conf and other default locations would be picked up.
   static const char* const kKrb5EnvVars[] = {
     "KRB5_CONFIG",
     "KRB5_KTNAME",
     "KRB5CCNAME",
   };
   for (const char* var_name : kKrb5EnvVars) {
     setenv(var_name, kInvalidPath, /*overwrite=*/1);
   }
 }

 ///////////////////////////////////////////////////
 // Test utility functions
 ///////////////////////////////////////////////////

 // Reports the boolean value of the KUDU_ALLOW_SLOW_TESTS environment variable.
 bool AllowSlowTests() {
   const bool slow_tests_allowed = GetBooleanEnvironmentVariable(kSlowTestsEnvVar);
   return slow_tests_allowed;
 }

 // Reports the boolean value of the KUDU_USE_LARGE_KEYS_IN_TESTS environment
 // variable.
 bool UseLargeKeys() {
   const bool large_keys_requested = GetBooleanEnvironmentVariable(kLargeKeysEnvVar);
   return large_keys_requested;
 }

 // When slow tests are allowed, sets flag 'flag_name' to 'new_value' using the
 // SET_FLAG_IF_DEFAULT mode. The flag name is validated in every case.
 void OverrideFlagForSlowTests(const std::string& flag_name,
                               const std::string& new_value) {
   // Dies if the flag does not exist, regardless of whether slow tests run.
   google::GetCommandLineFlagInfoOrDie(flag_name.c_str());

   // Only override the flag when slow tests are enabled.
   if (AllowSlowTests()) {
     google::SetCommandLineOptionWithMode(flag_name.c_str(), new_value.c_str(),
                                          google::SET_FLAG_IF_DEFAULT);
   }
 }

 // Seeds rand() and returns the seed that was used. The seed comes from
 // --test_random_seed when that flag is non-zero, and from the current time
 // in microseconds (narrowed to int) otherwise. The chosen seed is logged.
 int SeedRandom() {
   const bool user_specified = (FLAGS_test_random_seed != 0);
   const int seed = user_specified
       ? FLAGS_test_random_seed
       : static_cast<int>(GetCurrentTimeMicros());
   LOG(INFO) << "Using random seed: " << seed;
   srand(seed);
   return seed;
 }

 // Returns the data directory for the currently running gtest test, creating
 // it on first use. When the directory is newly created, a 'test_metadata'
 // file describing the owning process is written into it. Must be called from
 // within a running gtest test.
 string GetTestDataDirectory() {
   const ::testing::TestInfo* const test_info =
       ::testing::UnitTest::GetInstance()->current_test_info();
   CHECK(test_info) << "Must be running in a gtest unit test to call this function";

   string base_dir;
   CHECK_OK(Env::Default()->GetTestDirectory(&base_dir));

   // The directory name is assembled from:
   // - program name: identifies the directory to the test invoker
   // - timestamp and pid: disambiguates with prior runs of the same test
   //
   // e.g. "env-test.TestEnv.TestReadFully.1409169025392361-23600"
   //
   // For sharded tests the shard index is included as well, so the invoker can
   // more easily identify all directories belonging to each shard.
   string shard_infix;
   const char* const shard_env = getenv("GTEST_SHARD_INDEX");
   if (shard_env != nullptr && *shard_env != '\0') {
     shard_infix = Substitute("$0.", shard_env);
   }

   const string program =
       StringReplace(google::ProgramInvocationShortName(), "/", "_", true);
   const string test_case =
       StringReplace(test_info->test_case_name(), "/", "_", true);
   const string test_name =
       StringReplace(test_info->name(), "/", "_", true);
   string dir = base_dir + Substitute("/$0.$1$2.$3.$4-$5",
                                      program,
                                      shard_infix,
                                      test_case,
                                      test_name,
                                      kTestBeganAtMicros,
                                      getpid());

   const Status s = Env::Default()->CreateDir(dir);
   CHECK(s.ok() || s.IsAlreadyPresent())
       << "Could not create directory " << dir << ": " << s.ToString();
   if (!s.ok()) {
     // The directory already existed; leave its metadata file untouched.
     return dir;
   }

   string metadata = Substitute("PID=$0\n", getpid());
   StrAppend(&metadata, Substitute("PPID=$0\n", getppid()));
   const char* const jenkins_build_id = getenv("BUILD_ID");
   if (jenkins_build_id != nullptr) {
     StrAppend(&metadata, Substitute("BUILD_ID=$0\n", jenkins_build_id));
   }
   CHECK_OK(WriteStringToFile(Env::Default(), metadata,
                              Substitute("$0/test_metadata", dir)));
   return dir;
 }

 // Builds a path of the form "<test directory>/<name>-<generated id>.sock".
 // A new id is generated on every call.
 string GetTestSocketPath(const string& name) {
   string test_dir;
   CHECK_OK(Env::Default()->GetTestDirectory(&test_dir));

   ObjectIdGenerator oid_generator;
   const string socket_file = Substitute("$0-$1.sock", name, oid_generator.Next());
   return JoinPathSegments(test_dir, socket_file);
 }

 // Returns the directory component of the running executable's path.
 string GetTestExecutableDirectory() {
   string executable_path;
   CHECK_OK(Env::Default()->GetExecutablePath(&executable_path));
   string parent_dir = DirName(executable_path);
   return parent_dir;
 }

 void AssertEventually(const std::function<void(void)>& f,
                       const MonoDelta& timeout,
                       AssertBackoff backoff) {
   const MonoTime deadline = MonoTime::Now() + timeout;
   {
     // Disable gtest's "on failure" behavior, or else the assertion failures
     // inside our attempts will cause the test to end even though we would
     // like to retry.
     bool old_break_on_failure = testing::FLAGS_gtest_break_on_failure;
     bool old_throw_on_failure = testing::FLAGS_gtest_throw_on_failure;
     auto c = MakeScopedCleanup([old_break_on_failure, old_throw_on_failure]() {
       testing::FLAGS_gtest_break_on_failure = old_break_on_failure;
       testing::FLAGS_gtest_throw_on_failure = old_throw_on_failure;
     });
     testing::FLAGS_gtest_break_on_failure = false;
     testing::FLAGS_gtest_throw_on_failure = false;

     for (int attempts = 0; MonoTime::Now() < deadline; attempts++) {
       // Capture any assertion failures within this scope (i.e. from their function)
       // into 'results'
       testing::TestPartResultArray results;
       testing::ScopedFakeTestPartResultReporter reporter(
           testing::ScopedFakeTestPartResultReporter::INTERCEPT_ONLY_CURRENT_THREAD,
           &results);
       f();

       // Determine whether their function produced any new test failure results.
       bool has_failures = false;
       for (int i = 0; i < results.size(); i++) {
         has_failures |= results.GetTestPartResult(i).failed();
       }
       if (!has_failures) {
         return;
       }

       // If they had failures, sleep and try again.
       int sleep_ms;
       switch (backoff) {
         case AssertBackoff::EXPONENTIAL:
           sleep_ms = (attempts < 10) ? (1 << attempts) : 1000;
           break;
         case AssertBackoff::NONE:
           sleep_ms = 1;
           break;
         default:
           LOG(FATAL) << "Unknown backoff type";
       }
       SleepFor(MonoDelta::FromMilliseconds(sleep_ms));
     }
   }

   // If we ran out of time looping, run their function one more time
   // without capturing its assertions. This way the assertions will
   // propagate back out to the normal test reporter. Of course it's
   // possible that it will pass on this last attempt, but that's OK
   // too, since we aren't trying to be that strict about the deadline.
   f();
   if (testing::Test::HasFatalFailure()) {
     ADD_FAILURE() << "Timed out waiting for assertion to pass.";
   }
 }

 // Counts this process's open file descriptors whose path matches
 // 'path_pattern' (as decided by MatchPattern()).
 //
 // The descriptors are enumerated by listing the per-process fd directory via
 // 'env' (/dev/fd on macOS, /proc/self/fd elsewhere), and each one is resolved
 // to a path with fcntl(F_GETPATH) on macOS or readlink() elsewhere.
 // Descriptors that disappear while iterating are skipped; any other
 // resolution error is fatal.
 int CountOpenFds(Env* env, const string& path_pattern) {
   static const char* kProcSelfFd =
 #if defined(__APPLE__)
     "/dev/fd";
 #else
     "/proc/self/fd";
 #endif // defined(__APPLE__)
   // Scratch buffer reused for every descriptor's resolved path.
   faststring path_buf;
   vector<string> children;
   CHECK_OK(env->GetChildren(kProcSelfFd, &children));
   int num_fds = 0;
   for (const auto& c : children) {
     // Skip '.' and '..'.
     if (c == "." || c == "..") {
       continue;
     }
     // Every remaining entry is expected to be a decimal fd number.
     int32_t fd;
     CHECK(safe_strto32(c, &fd)) << "Unexpected file in fd list: " << c;
 #ifdef __APPLE__
     path_buf.resize(MAXPATHLEN);
     if (fcntl(fd, F_GETPATH, path_buf.data()) != 0) {
       if (errno == EBADF) {
         // The file was closed while we were looping. This is likely the
         // actual file descriptor used for opening /proc/fd itself.
         continue;
       }
       PLOG(FATAL) << "Unknown error in fcntl(F_GETPATH): " << fd;
     }
     // Shrink the buffer to the length of the string written by fcntl().
     char* buf_data = reinterpret_cast<char*>(path_buf.data());
     path_buf.resize(strlen(buf_data));
 #else
     path_buf.resize(PATH_MAX);
     char* buf_data = reinterpret_cast<char*>(path_buf.data());
     auto proc_file = JoinPathSegments(kProcSelfFd, c);
     int path_len = readlink(proc_file.c_str(), buf_data, path_buf.size());
     if (path_len < 0) {
       if (errno == ENOENT) {
         // The file was closed while we were looping. This is likely the
         // actual file descriptor used for opening /proc/fd itself.
         continue;
       }
       PLOG(FATAL) << "Unknown error in readlink: " << proc_file;
     }
     // readlink() does not NUL-terminate; trim the buffer to the bytes written.
     path_buf.resize(path_len);
 #endif
     if (!MatchPattern(path_buf.ToString(), path_pattern)) {
       continue;
     }
     num_fds++;
   }

   return num_fds;
 }

 namespace {
 // Polls 'lsof' until process 'pid' has a bound socket of the given 'kind'
 // (an lsof '-i' selector such as "4TCP") on one of 'addresses', and stores
 // the bound port in '*port'.
 //
 // If 'addresses' is empty, the wildcard address "0.0.0.0" is used, which is
 // matched against lsof's '*' notation. Returns the FindExecutable() error if
 // lsof cannot be located. Otherwise keeps retrying, sleeping progressively
 // longer between rounds, until a port is found or 'timeout' has elapsed, in
 // which case the status of the last failed attempt is returned.
 Status WaitForBind(pid_t pid, uint16_t* port,
                    const vector<string>& addresses,
                    const char* kind,
                    MonoDelta timeout) {
   static const vector<string> kWildcard = { "0.0.0.0" };

   // In general, processes do not expose the port they bind to, and
   // reimplementing lsof involves parsing a lot of files in /proc/. So,
   // requiring lsof for tests and parsing its output seems more
   // straight-forward. We call lsof in a loop since it typically takes a long
   // time for it to initialize and bind a port.

   string lsof;
   RETURN_NOT_OK(FindExecutable("lsof", {"/sbin", "/usr/sbin"}, &lsof));

   const vector<string> cmd = {
     lsof, "-wbnP", "-Ffn",
     "-p", std::to_string(pid),
     "-a", "-i", kind
   };

   // The '-Ffn' flag gets lsof to output something like:
   //   p5801
   //   f548
   //   n127.0.0.1:43954->127.0.0.1:43617
   //   f549
   //   n*:8038
   //
   // The first line is the pid. We ignore it.
   // Subsequent lines come in pairs. In each pair, the first half of the pair
   // is file descriptor number, we ignore it.
   // The second half has the bind address and port.
   //
   // In this example, the first pair is an outbound TCP socket. We ignore it.
   // The second pair is the listening TCP socket bind address and port.
   //
   // We use the first encountered listening TCP socket, since that's most likely
   // to be the primary service port. When searching, we use the provided bind
   // address if there is any, otherwise we use '*' (same as '0.0.0.0') which
   // matches all addresses on the local machine.
   const MonoTime deadline = MonoTime::Now() + timeout;
   const auto& addresses_to_check = addresses.empty() ? kWildcard : addresses;
   for (int64_t i = 1; ; ++i) {
     for (const auto& addr : addresses_to_check) {
       string addr_pattern = Substitute("n$0:", addr == "0.0.0.0" ? "*" : addr);
       string lsof_out;
       int32_t p = -1;
       Status s = Subprocess::Call(cmd, "", &lsof_out).AndThen([&] () {
         StripTrailingNewline(&lsof_out);
         vector<string> lines = strings::Split(lsof_out, "\n");
         // Address lines sit at the even indices starting from 2 (index 0 is
         // the pid line, odd indices are fd lines). The index is unsigned to
         // match lines.size().
         for (size_t index = 2; index < lines.size(); index += 2) {
           StringPiece cur_line(lines[index]);
           if (HasPrefixString(cur_line.ToString(), addr_pattern) &&
               !cur_line.contains("->")) {
             cur_line.remove_prefix(addr_pattern.size());
             if (!safe_strto32(cur_line.data(), cur_line.size(), &p)) {
               return Status::RuntimeError("unexpected lsof output", lsof_out);
             }

             return Status::OK();
           }
         }

         return Status::RuntimeError("unexpected lsof output", lsof_out);
       });

       if (s.ok()) {
         // Valid ports are 1..65535 inclusive, so the maximum uint16_t value
         // itself must be accepted.
         CHECK(p > 0 && p <= std::numeric_limits<uint16_t>::max())
             << "parsed invalid port: " << p;
         VLOG(1) << "Determined bound port: " << p;
         *port = static_cast<uint16_t>(p);

         return Status::OK();
       }
       if (deadline < MonoTime::Now()) {
         return s;
       }
     }
     // Linear backoff between polling rounds: 10ms, 20ms, 30ms, ...
     SleepFor(MonoDelta::FromMilliseconds(i * 10));
   }

   // Should not reach here.
   LOG(FATAL) << "could not determine bound port the process";
   __builtin_unreachable();
 }
 } // anonymous namespace

 // Waits for process 'pid' to bind an IPv4 TCP socket; see WaitForBind().
 Status WaitForTcpBind(pid_t pid, uint16_t* port,
                       const vector<string>& addresses,
                       MonoDelta timeout) {
   // lsof '-i' selector for IPv4 TCP sockets.
   static const char* const kKind = "4TCP";
   return WaitForBind(pid, port, addresses, kKind, timeout);
 }

 // Waits for process 'pid' to bind an IPv4 UDP socket; see WaitForBind().
 Status WaitForUdpBind(pid_t pid, uint16_t* port,
                       const vector<string>& addresses,
                       MonoDelta timeout) {
   // lsof '-i' selector for IPv4 UDP sockets.
   static const char* const kKind = "4UDP";
   return WaitForBind(pid, port, addresses, kKind, timeout);
 }

 // Locates the home directory of component 'name'. The directory is taken
 // from the <NAME>_HOME environment variable when it is set, and defaults to
 // '<bin_dir>/<name>-home' otherwise. Stores the result in '*home_dir' and
 // returns OK if the directory exists; returns NotFound (leaving '*home_dir'
 // untouched) if it does not.
 Status FindHomeDir(const string& name, const string& bin_dir, string* home_dir) {
   string upper_name;
   ToUpperCase(name, &upper_name);
   const string env_var = Substitute("$0_HOME", upper_name);

   string candidate;
   const char* const from_env = std::getenv(env_var.c_str());
   if (from_env != nullptr) {
     candidate = from_env;
   } else {
     candidate = JoinPathSegments(bin_dir, Substitute("$0-home", name));
   }

   if (Env::Default()->FileExists(candidate)) {
     *home_dir = candidate;
     return Status::OK();
   }
   return Status::NotFound(Substitute("$0 directory does not exist", env_var), candidate);
 }

 } // namespace kudu
	// Licensed to the Apache Software Foundation (ASF) under one
	// or more contributor license agreements. See the NOTICE file
	// distributed with this work for additional information
	// regarding copyright ownership. The ASF licenses this file
	// to you under the Apache License, Version 2.0 (the
	// "License"); you may not use this file except in compliance
	// with the License. You may obtain a copy of the License at
	//
	// http://www.apache.org/licenses/LICENSE-2.0
	//
	// Unless required by applicable law or agreed to in writing,
	// software distributed under the License is distributed on an
	// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	// KIND, either express or implied. See the License for the
	// specific language governing permissions and limitations
	// under the License.

	#include "kudu/util/test_util.h"

	#include <limits.h>
	#include <unistd.h>

	#include <cerrno>
	#include <cstdlib>
	#include <limits>
	#include <map>
	#include <memory>
	#include <ostream>
	#include <string>
	#include <utility>
	#include <vector>

	#ifdef __APPLE__
	#include <fcntl.h>
	#include <sys/param.h> // for MAXPATHLEN
	#endif

	#include <gflags/gflags.h>
	#include <glog/logging.h>
	#include <gtest/gtest-spi.h>

	#include "kudu/gutil/strings/numbers.h"
	#include "kudu/gutil/strings/split.h"
	#include "kudu/gutil/strings/strcat.h"
	#include "kudu/gutil/strings/stringpiece.h"
	#include "kudu/gutil/strings/strip.h"
	#include "kudu/gutil/strings/substitute.h"
	#include "kudu/gutil/strings/util.h"
	#include "kudu/gutil/walltime.h"
	#include "kudu/util/env.h"
	#include "kudu/util/faststring.h"
	#include "kudu/util/flags.h"
	#include "kudu/util/oid_generator.h"
	#include "kudu/util/path_util.h"
	#include "kudu/util/scoped_cleanup.h"
	#include "kudu/util/slice.h"
	#include "kudu/util/spinlock_profiling.h"
	#include "kudu/util/status.h"
	#include "kudu/util/string_case.h"
	#include "kudu/util/subprocess.h"

	// Policy consulted by KuduTest's destructor when deciding whether to delete
	// the per-test data directory.
	DEFINE_string(test_leave_files, "on_failure",
	"Whether to leave test files around after the test run. "
	" Valid values are 'always', 'on_failure', or 'never'");

	// Seed consumed by SeedRandom(); the default of 0 makes SeedRandom() derive a
	// seed from the current time instead.
	DEFINE_int32(test_random_seed, 0, "Random seed to use for randomized tests");

	// Declaration only: the flag itself is defined in another translation unit.
	DECLARE_string(time_source);

	using std::string;
	using std::vector;
	using strings::Substitute;

	namespace kudu {

	// Placeholder path used by OverrideKrb5Environment() for the Kerberos
	// environment variables.
	const char* kInvalidPath = "/dev/invalid-path-for-kudu-tests";
	// Names of the environment variables read by AllowSlowTests() and
	// UseLargeKeys() respectively.
	static const char* const kSlowTestsEnvVar = "KUDU_ALLOW_SLOW_TESTS";
	static const char* const kLargeKeysEnvVar = "KUDU_USE_LARGE_KEYS_IN_TESTS";

	// Timestamp captured when this file's statics are initialized;
	// GetTestDataDirectory() embeds it in the per-test directory name.
	static const uint64_t kTestBeganAtMicros = Env::Default()->NowMicros();

	// Global which production code can check to see if it is running
	// in a GTest environment (assuming the test binary links in this module,
	// which is typically a good assumption).
	//
	// This can be checked using the 'IsGTest()' function from test_util_prod.cc.
	bool g_is_gtest = true;

	///////////////////////////////////////////////////
	// KuduTest
	///////////////////////////////////////////////////

	// Prepares the per-test environment: snapshots the gflags state, creates the
	// test data directory, and installs flag defaults suited to unit tests.
	KuduTest::KuduTest()
	    : env_(Env::Default()),
	      flag_saver_(new google::FlagSaver()),
	      test_dir_(GetTestDataDirectory()) {
	  // Flag name -> default value. Both sides are C strings, so the map must
	  // hold 'const char*' (a map of plain 'const char' cannot store them).
	  std::map<const char*, const char*> flags_for_tests = {
	    // Disabling fsync() speeds up tests dramatically, and it's safe to do as no
	    // tests rely on cutting power to a machine or equivalent.
	    {"never_fsync", "true"},
	    // Disable redaction.
	    {"redact", "none"},
	    // For a generic Kudu test, the local wall-clock time is good enough even
	    // if it's not synchronized by NTP. All test components are run at the same
	    // node, so there aren't multiple time sources to synchronize.
	    {"time_source", "system_unsync"},
	  };
	  if (!UseLargeKeys()) {
	    // Reduce default RSA key length for faster tests. We are using strong/high
	    // TLS v1.2 cipher suites, so minimum possible for TLS-related RSA keys is
	    // 768 bits. Java security policies in tests tweaked appropriately to allow
	    // for using smaller RSA keys in certificates. As for the TSK keys, 512 bits
	    // is the minimum since the SHA256 digest is used for token
	    // signing/verification.
	    flags_for_tests.emplace("ipki_server_key_size", "768");
	    flags_for_tests.emplace("ipki_ca_key_size", "768");
	    flags_for_tests.emplace("tsk_num_rsa_bits", "512");
	    // Some OS distros set the default security level higher than 0, so it's
	    // necessary to override it to use the key length specified above (which are
	    // considered lax and don't work in case of security level 2 or higher).
	    flags_for_tests.emplace("openssl_security_level_override", "0");
	  }
	  for (const auto& e : flags_for_tests) {
	    // We don't check for errors here, because we have some default flags that
	    // only apply to certain tests. If a flag is defined in a library which
	    // the test binary isn't linked with, then SetCommandLineOptionWithMode()
	    // reports an error since the flag is unknown to the gflags runtime.
	    google::SetCommandLineOptionWithMode(e.first, e.second, google::SET_FLAGS_DEFAULT);
	  }
	  // If the TEST_TMPDIR variable has been set, then glog will automatically use that
	  // as its default log directory. We would prefer that the default log directory
	  // instead be the test-case-specific subdirectory.
	  FLAGS_log_dir = GetTestDataDirectory();
	}

	// Restores the saved flags and then, depending on --test_leave_files and on
	// whether the test had a fatal failure, either keeps or deletes the test
	// directory.
	//
	// Cleanup lives in the destructor rather than in TearDown() so that the
	// child-class destructor runs first: anything it owns (a minicluster, etc.)
	// is shut down before the files underneath it are removed.
	KuduTest::~KuduTest() {
	  // Restore the flags before anything else so that they cannot affect the
	  // test directory cleanup below.
	  flag_saver_.reset();

	  const string& leave_policy = FLAGS_test_leave_files;
	  if (leave_policy == "always") {
	    LOG(INFO) << "-----------------------------------------------";
	    LOG(INFO) << "--test_leave_files specified, leaving files in " << test_dir_;
	    return;
	  }
	  if (leave_policy == "on_failure" && HasFatalFailure()) {
	    LOG(INFO) << "-----------------------------------------------";
	    LOG(INFO) << "Had fatal failures, leaving test files at " << test_dir_;
	    return;
	  }

	  VLOG(1) << "Cleaning up temporary test files...";
	  WARN_NOT_OK(env_->DeleteRecursively(test_dir_),
	              "Couldn't remove test files");
	}

	void KuduTest::SetUp() {
	InitSpinLockContentionProfiling();
	OverrideKrb5Environment();
	}

	// Returns 'relative_path' joined onto this test's data directory.
	string KuduTest::GetTestPath(const string& relative_path) const {
	  string full_path = JoinPathSegments(test_dir_, relative_path);
	  return full_path;
	}

	// Points the Kerberos environment variables at kInvalidPath, overwriting any
	// existing values.
	void KuduTest::OverrideKrb5Environment() {
	  // The target must be a path that definitely does not exist and could not be
	  // created by accident.
	  //
	  // /dev/null is not a suitable target: krb5 leaks when it reads an empty file
	  // as a ticket cache, whereas non-existent files do not trigger that. See
	  // MIT krb5 bug #8509.
	  //
	  // NOTE: simply *unsetting* the variables is not enough either, because then
	  // the user's /etc/krb5.conf and other default locations would be picked up.
	  static const char* const kKrb5EnvVars[] = {
	    "KRB5_CONFIG",
	    "KRB5_KTNAME",
	    "KRB5CCNAME",
	  };
	  for (const char* var_name : kKrb5EnvVars) {
	    setenv(var_name, kInvalidPath, /*overwrite=*/1);
	  }
	}

	///////////////////////////////////////////////////
	// Test utility functions
	///////////////////////////////////////////////////

	// Reports the boolean value of the KUDU_ALLOW_SLOW_TESTS environment variable.
	bool AllowSlowTests() {
	  const bool slow_tests_allowed = GetBooleanEnvironmentVariable(kSlowTestsEnvVar);
	  return slow_tests_allowed;
	}

	// Reports the boolean value of the KUDU_USE_LARGE_KEYS_IN_TESTS environment
	// variable.
	bool UseLargeKeys() {
	  const bool large_keys_requested = GetBooleanEnvironmentVariable(kLargeKeysEnvVar);
	  return large_keys_requested;
	}

	// When slow tests are allowed, sets flag 'flag_name' to 'new_value' using the
	// SET_FLAG_IF_DEFAULT mode. The flag name is validated in every case.
	void OverrideFlagForSlowTests(const std::string& flag_name,
	                              const std::string& new_value) {
	  // Dies if the flag does not exist, regardless of whether slow tests run.
	  google::GetCommandLineFlagInfoOrDie(flag_name.c_str());

	  // Only override the flag when slow tests are enabled.
	  if (AllowSlowTests()) {
	    google::SetCommandLineOptionWithMode(flag_name.c_str(), new_value.c_str(),
	                                         google::SET_FLAG_IF_DEFAULT);
	  }
	}

	// Seeds rand() and returns the seed that was used. The seed comes from
	// --test_random_seed when that flag is non-zero, and from the current time
	// in microseconds (narrowed to int) otherwise. The chosen seed is logged.
	int SeedRandom() {
	  const bool user_specified = (FLAGS_test_random_seed != 0);
	  const int seed = user_specified
	      ? FLAGS_test_random_seed
	      : static_cast<int>(GetCurrentTimeMicros());
	  LOG(INFO) << "Using random seed: " << seed;
	  srand(seed);
	  return seed;
	}

	// Returns the data directory for the currently running gtest test, creating
	// it on first use. When the directory is newly created, a 'test_metadata'
	// file describing the owning process is written into it. Must be called from
	// within a running gtest test.
	string GetTestDataDirectory() {
	  const ::testing::TestInfo* const test_info =
	      ::testing::UnitTest::GetInstance()->current_test_info();
	  CHECK(test_info) << "Must be running in a gtest unit test to call this function";
	  string dir;
	  CHECK_OK(Env::Default()->GetTestDirectory(&dir));

	  // The directory name includes some strings for specific reasons:
	  // - program name: identifies the directory to the test invoker
	  // - timestamp and pid: disambiguates with prior runs of the same test
	  //
	  // e.g. "env-test.TestEnv.TestReadFully.1409169025392361-23600"
	  //
	  // If the test is sharded, the shard index is also included so that the test
	  // invoker can more easily identify all directories belonging to each shard.
	  string shard_index_infix;
	  const char* shard_index = getenv("GTEST_SHARD_INDEX");
	  if (shard_index && shard_index[0] != '\0') {
	    shard_index_infix = Substitute("$0.", shard_index);
	  }
	  dir += Substitute("/$0.$1$2.$3.$4-$5",
	    StringReplace(google::ProgramInvocationShortName(), "/", "_", true),
	    shard_index_infix,
	    StringReplace(test_info->test_case_name(), "/", "_", true),
	    StringReplace(test_info->name(), "/", "_", true),
	    kTestBeganAtMicros,
	    getpid());
	  Status s = Env::Default()->CreateDir(dir);
	  // An already-existing directory is fine; any other failure is fatal.
	  CHECK(s.IsAlreadyPresent() || s.ok())
	    << "Could not create directory " << dir << ": " << s.ToString();
	  if (s.ok()) {
	    // The metadata file is written only when the directory is newly created.
	    string metadata;

	    StrAppend(&metadata, Substitute("PID=$0\n", getpid()));

	    StrAppend(&metadata, Substitute("PPID=$0\n", getppid()));

	    char* jenkins_build_id = getenv("BUILD_ID");
	    if (jenkins_build_id) {
	      StrAppend(&metadata, Substitute("BUILD_ID=$0\n", jenkins_build_id));
	    }

	    CHECK_OK(WriteStringToFile(Env::Default(), metadata,
	                               Substitute("$0/test_metadata", dir)));
	  }
	  return dir;
	}

	// Builds a path of the form "<test directory>/<name>-<generated id>.sock".
	// A new id is generated on every call.
	string GetTestSocketPath(const string& name) {
	  string test_dir;
	  CHECK_OK(Env::Default()->GetTestDirectory(&test_dir));

	  ObjectIdGenerator oid_generator;
	  const string socket_file = Substitute("$0-$1.sock", name, oid_generator.Next());
	  return JoinPathSegments(test_dir, socket_file);
	}

	// Returns the directory component of the running executable's path.
	string GetTestExecutableDirectory() {
	  string executable_path;
	  CHECK_OK(Env::Default()->GetExecutablePath(&executable_path));
	  string parent_dir = DirName(executable_path);
	  return parent_dir;
	}

	// Repeatedly runs 'f' until it completes without recording any gtest failure
	// or until 'timeout' elapses. Failures raised during the retries are
	// intercepted and discarded. After the deadline, 'f' is run one last time
	// without interception so that its failures reach the normal test reporter.
	// 'backoff' selects how long to sleep between attempts.
	void AssertEventually(const std::function<void(void)>& f,
	                      const MonoDelta& timeout,
	                      AssertBackoff backoff) {
	  const MonoTime deadline = MonoTime::Now() + timeout;
	  {
	    // Disable gtest's "on failure" behavior, or else the assertion failures
	    // inside our attempts will cause the test to end even though we would
	    // like to retry. The previous settings are restored on scope exit.
	    bool old_break_on_failure = testing::FLAGS_gtest_break_on_failure;
	    bool old_throw_on_failure = testing::FLAGS_gtest_throw_on_failure;
	    auto c = MakeScopedCleanup([old_break_on_failure, old_throw_on_failure]() {
	      testing::FLAGS_gtest_break_on_failure = old_break_on_failure;
	      testing::FLAGS_gtest_throw_on_failure = old_throw_on_failure;
	    });
	    testing::FLAGS_gtest_break_on_failure = false;
	    testing::FLAGS_gtest_throw_on_failure = false;

	    for (int attempts = 0; MonoTime::Now() < deadline; attempts++) {
	      // Capture any assertion failures within this scope (i.e. from their function)
	      // into 'results'
	      testing::TestPartResultArray results;
	      testing::ScopedFakeTestPartResultReporter reporter(
	          testing::ScopedFakeTestPartResultReporter::INTERCEPT_ONLY_CURRENT_THREAD,
	          &results);
	      f();

	      // Determine whether their function produced any new test failure results.
	      bool has_failures = false;
	      for (int i = 0; i < results.size(); i++) {
	        has_failures |= results.GetTestPartResult(i).failed();
	      }
	      if (!has_failures) {
	        return;
	      }

	      // If they had failures, sleep and try again.
	      int sleep_ms;
	      switch (backoff) {
	        case AssertBackoff::EXPONENTIAL:
	          // 1ms, 2ms, 4ms, ... for the first ten attempts, then 1s.
	          sleep_ms = (attempts < 10) ? (1 << attempts) : 1000;
	          break;
	        case AssertBackoff::NONE:
	          sleep_ms = 1;
	          break;
	        default:
	          LOG(FATAL) << "Unknown backoff type";
	      }
	      SleepFor(MonoDelta::FromMilliseconds(sleep_ms));
	    }
	  }

	  // If we ran out of time looping, run their function one more time
	  // without capturing its assertions. This way the assertions will
	  // propagate back out to the normal test reporter. Of course it's
	  // possible that it will pass on this last attempt, but that's OK
	  // too, since we aren't trying to be that strict about the deadline.
	  f();
	  if (testing::Test::HasFatalFailure()) {
	    ADD_FAILURE() << "Timed out waiting for assertion to pass.";
	  }
	}

	// Counts this process's open file descriptors whose path matches
	// 'path_pattern' (as decided by MatchPattern()).
	//
	// The descriptors are enumerated by listing the per-process fd directory via
	// 'env' (/dev/fd on macOS, /proc/self/fd elsewhere), and each one is resolved
	// to a path with fcntl(F_GETPATH) on macOS or readlink() elsewhere.
	// Descriptors that disappear while iterating are skipped; any other
	// resolution error is fatal.
	int CountOpenFds(Env* env, const string& path_pattern) {
	  static const char* kProcSelfFd =
	#if defined(__APPLE__)
	    "/dev/fd";
	#else
	    "/proc/self/fd";
	#endif // defined(__APPLE__)
	  // Scratch buffer reused for every descriptor's resolved path.
	  faststring path_buf;
	  vector<string> children;
	  CHECK_OK(env->GetChildren(kProcSelfFd, &children));
	  int num_fds = 0;
	  for (const auto& c : children) {
	    // Skip '.' and '..'.
	    if (c == "." || c == "..") {
	      continue;
	    }
	    // Every remaining entry is expected to be a decimal fd number.
	    int32_t fd;
	    CHECK(safe_strto32(c, &fd)) << "Unexpected file in fd list: " << c;
	#ifdef __APPLE__
	    path_buf.resize(MAXPATHLEN);
	    if (fcntl(fd, F_GETPATH, path_buf.data()) != 0) {
	      if (errno == EBADF) {
	        // The file was closed while we were looping. This is likely the
	        // actual file descriptor used for opening /proc/fd itself.
	        continue;
	      }
	      PLOG(FATAL) << "Unknown error in fcntl(F_GETPATH): " << fd;
	    }
	    // Shrink the buffer to the length of the string written by fcntl().
	    char* buf_data = reinterpret_cast<char*>(path_buf.data());
	    path_buf.resize(strlen(buf_data));
	#else
	    path_buf.resize(PATH_MAX);
	    char* buf_data = reinterpret_cast<char*>(path_buf.data());
	    auto proc_file = JoinPathSegments(kProcSelfFd, c);
	    int path_len = readlink(proc_file.c_str(), buf_data, path_buf.size());
	    if (path_len < 0) {
	      if (errno == ENOENT) {
	        // The file was closed while we were looping. This is likely the
	        // actual file descriptor used for opening /proc/fd itself.
	        continue;
	      }
	      PLOG(FATAL) << "Unknown error in readlink: " << proc_file;
	    }
	    // readlink() does not NUL-terminate; trim the buffer to the bytes written.
	    path_buf.resize(path_len);
	#endif
	    if (!MatchPattern(path_buf.ToString(), path_pattern)) {
	      continue;
	    }
	    num_fds++;
	  }

	  return num_fds;
	}

	namespace {
	// Repeatedly runs lsof against process 'pid' until it reports a bound,
	// non-connected socket matching the lsof '-i' selector 'kind' (e.g. "4TCP"),
	// then stores that socket's port in '*port'.
	//
	// 'addresses' limits the search to sockets bound to one of the given
	// addresses. If it is empty, the wildcard address "0.0.0.0" is used, which is
	// matched against lsof's '*' notation.
	//
	// Returns OK once a port has been determined. Returns an error if the lsof
	// binary cannot be found, or the status of the last failed attempt once
	// 'timeout' has elapsed.
	Status WaitForBind(pid_t pid, uint16_t* port,
	                   const vector<string>& addresses,
	                   const char* kind,
	                   MonoDelta timeout) {
	  static const vector<string> kWildcard = { "0.0.0.0" };

	  // In general, processes do not expose the port they bind to, and
	  // reimplementing lsof involves parsing a lot of files in /proc/. So,
	  // requiring lsof for tests and parsing its output seems more
	  // straight-forward. We call lsof in a loop since the target process may
	  // take a while to initialize and bind a port.

	  string lsof;
	  RETURN_NOT_OK(FindExecutable("lsof", {"/sbin", "/usr/sbin"}, &lsof));

	  const vector<string> cmd = {
	    lsof, "-wbnP", "-Ffn",
	    "-p", std::to_string(pid),
	    "-a", "-i", kind
	  };

	  // The '-Ffn' flag gets lsof to output something like:
	  //   p5801
	  //   f548
	  //   n127.0.0.1:43954->127.0.0.1:43617
	  //   f549
	  //   n*:8038
	  //
	  // The first line is the pid. We ignore it.
	  // Subsequent lines come in pairs. In each pair, the first half of the pair
	  // is the file descriptor number, which we ignore.
	  // The second half has the bind address and port.
	  //
	  // In this example, the first pair is an outbound TCP socket. We ignore it.
	  // The second pair is the listening TCP socket bind address and port.
	  //
	  // We use the first encountered listening socket, since that's most likely
	  // to be the primary service port. When searching, we use the provided bind
	  // address if there is any, otherwise we use '*' (same as '0.0.0.0') which
	  // matches all addresses on the local machine.
	  const MonoTime deadline = MonoTime::Now() + timeout;
	  const auto& addresses_to_check = addresses.empty() ? kWildcard : addresses;
	  for (int64_t i = 1; ; ++i) {
	    for (const auto& addr : addresses_to_check) {
	      string addr_pattern = Substitute("n$0:", addr == "0.0.0.0" ? "*" : addr);
	      string lsof_out;
	      int32_t p = -1;
	      Status s = Subprocess::Call(cmd, "", &lsof_out).AndThen([&] () {
	        StripTrailingNewline(&lsof_out);
	        vector<string> lines = strings::Split(lsof_out, "\n");
	        // Index 0 is the pid line and odd indices are fd lines, so the
	        // address lines live at the even indices starting from 2.
	        for (size_t index = 2; index < lines.size(); index += 2) {
	          StringPiece cur_line(lines[index]);
	          // A line containing "->" describes a connected socket, not a
	          // bound/listening one.
	          if (HasPrefixString(cur_line.ToString(), addr_pattern) &&
	              !cur_line.contains("->")) {
	            cur_line.remove_prefix(addr_pattern.size());
	            if (!safe_strto32(cur_line.data(), cur_line.size(), &p)) {
	              return Status::RuntimeError("unexpected lsof output", lsof_out);
	            }

	            return Status::OK();
	          }
	        }

	        return Status::RuntimeError("unexpected lsof output", lsof_out);
	      });

	      if (s.ok()) {
	        // Valid ports are 1..65535 inclusive, so the upper bound must be
	        // accepted rather than rejected.
	        CHECK(p > 0 && p <= std::numeric_limits<uint16_t>::max())
	            << "parsed invalid port: " << p;
	        VLOG(1) << "Determined bound port: " << p;
	        *port = static_cast<uint16_t>(p);

	        return Status::OK();
	      }
	      if (deadline < MonoTime::Now()) {
	        return s;
	      }
	    }
	    // Back off a little longer after every unsuccessful round.
	    SleepFor(MonoDelta::FromMilliseconds(i * 10));
	  }

	  // Should not reach here.
	  LOG(FATAL) << "could not determine bound port the process";
	  __builtin_unreachable();
	}
	} // anonymous namespace

	// Waits up to 'timeout' for process 'pid' to bind a TCP socket on one of
	// 'addresses' and stores the bound port in '*port'. This is WaitForBind()
	// with the lsof '-i' selector fixed to "4TCP".
	Status WaitForTcpBind(pid_t pid, uint16_t* port,
	                      const vector<string>& addresses,
	                      MonoDelta timeout) {
	  const char* const socket_kind = "4TCP";
	  return WaitForBind(pid, port, addresses, socket_kind, timeout);
	}

	// Waits up to 'timeout' for process 'pid' to bind a UDP socket on one of
	// 'addresses' and stores the bound port in '*port'. This is WaitForBind()
	// with the lsof '-i' selector fixed to "4UDP".
	Status WaitForUdpBind(pid_t pid, uint16_t* port,
	                      const vector<string>& addresses,
	                      MonoDelta timeout) {
	  const char* const socket_kind = "4UDP";
	  return WaitForBind(pid, port, addresses, socket_kind, timeout);
	}

	// Locates the home directory for the component called 'name'.
	//
	// If the environment variable "<NAME>_HOME" is set (where <NAME> is 'name'
	// upper-cased), its value is the candidate directory. Otherwise the candidate
	// is 'bin_dir' joined with "<name>-home".
	//
	// If Env::Default() reports that the candidate exists, it is stored in
	// '*home_dir' and OK is returned. Otherwise NotFound is returned and
	// '*home_dir' is left untouched.
	Status FindHomeDir(const string& name, const string& bin_dir, string* home_dir) {
	  string upper_name;
	  ToUpperCase(name, &upper_name);
	  const string home_env_var = Substitute("$0_HOME", upper_name);

	  // An explicit environment override wins over the default location.
	  string candidate;
	  if (const char* override_dir = std::getenv(home_env_var.c_str())) {
	    candidate = override_dir;
	  } else {
	    candidate = JoinPathSegments(bin_dir, Substitute("$0-home", name));
	  }

	  if (Env::Default()->FileExists(candidate)) {
	    *home_dir = candidate;
	    return Status::OK();
	  }
	  return Status::NotFound(Substitute("$0 directory does not exist", home_env_var), candidate);
	}

	} // namespace kudu