src/tests/slave_recovery_tests.cpp - mesos - Git at Google

 /**
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #include <unistd.h>

 #include <gtest/gtest.h>

 #include <string>

 #include <mesos/executor.hpp>
 #include <mesos/resources.hpp>
 #include <mesos/scheduler.hpp>

 #include <process/dispatch.hpp>
 #include <process/gmock.hpp>

 #include <stout/none.hpp>
 #include <stout/numify.hpp>
 #include <stout/option.hpp>
 #include <stout/os.hpp>
 #include <stout/path.hpp>
 #include <stout/uuid.hpp>

 #include "common/protobuf_utils.hpp"

 #include "detector/detector.hpp"

 #ifdef __linux__
 #include "linux/cgroups.hpp"
 #endif

 #include "master/master.hpp"

 #include "slave/gc.hpp"
 #ifdef __linux__
 #include "slave/cgroups_isolator.hpp"
 #endif
 #include "slave/paths.hpp"
 #include "slave/process_isolator.hpp"
 #include "slave/reaper.hpp"
 #include "slave/slave.hpp"
 #include "slave/state.hpp"

 #include "messages/messages.hpp"

 #include "tests/mesos.hpp"
 #include "tests/utils.hpp"

 using namespace mesos;
 using namespace mesos::internal;
 using namespace mesos::internal::slave;
 using namespace mesos::internal::tests;

 using namespace process;

 using mesos::internal::master::Master;

 using mesos::internal::slave::GarbageCollectorProcess;
 #ifdef __linux__
 using mesos::internal::slave::CgroupsIsolator;
 #endif
 using mesos::internal::slave::ProcessIsolator;

 using std::map;
 using std::string;
 using std::vector;

 using testing::_;
 using testing::AtMost;
 using testing::Eq;
 using testing::Return;
 using testing::SaveArg;


 // Fixture for the slave state checkpointing tests below. It adds
 // nothing of its own on top of TemporaryDirectoryTest.
 class SlaveStateTest : public TemporaryDirectoryTest {};


 // Checkpoints a SlaveID protobuf to a file and verifies that reading
 // the file back yields an equal SlaveID.
 TEST_F(SlaveStateTest, CheckpointProtobuf)
 {
   const string path = "slave.id";

   // The slave id that gets checkpointed.
   SlaveID slaveId;
   slaveId.set_value("slave1");

   state::checkpoint(path, slaveId);

   // Read the protobuf back and compare it with what was written.
   const Result<SlaveID>& restored = ::protobuf::read<SlaveID>(path);
   ASSERT_SOME(restored);

   ASSERT_SOME_EQ(slaveId, restored);
 }


 // Checkpoints a plain string to a file and verifies that the file
 // contents match the string.
 TEST_F(SlaveStateTest, CheckpointString)
 {
   const string path = "test-file";
   const string contents = "test";

   // Write the string out ...
   state::checkpoint(path, contents);

   // ... and make sure reading the file gives it back unchanged.
   ASSERT_SOME_EQ(contents, os::read(path));
 }


 // Fixture for the slave recovery tests, parameterized on the isolator
 // type 'T'. Slaves started with the flags from this fixture have
 // checkpointing enabled and use strict 'reconnect' recovery.
 template <typename T>
 class SlaveRecoveryTest : public IsolatorTest<T>
 {
 public:
   // Returns the flags produced by IsolatorTest<T> with the recovery
   // related settings filled in.
   virtual slave::Flags CreateSlaveFlags()
   {
     slave::Flags recoveryFlags = IsolatorTest<T>::CreateSlaveFlags();

     recoveryFlags.strict = true;
     recoveryFlags.recover = "reconnect";
     recoveryFlags.checkpoint = true;

     return recoveryFlags;
   }
 };


 // The isolator implementations the typed tests below are run against.
 // The cgroups isolator is only part of the list when building on Linux.
 #ifdef __linux__
 typedef ::testing::Types<ProcessIsolator, CgroupsIsolator> IsolatorTypes;
 #else
 typedef ::testing::Types<ProcessIsolator> IsolatorTypes;
 #endif

 // Register SlaveRecoveryTest as a typed test case over IsolatorTypes.
 TYPED_TEST_CASE(SlaveRecoveryTest, IsolatorTypes);


 // Enable checkpointing on the slave and ensure recovery works.
 //
 // A checkpointing framework launches a long-running task. Once the
 // acknowledgement of the TASK_RUNNING update has been dispatched on
 // the slave, the checkpointed state is read back with
 // 'state::recover' and compared against the slave id, framework
 // id/pid, executor id/pid, task info, status update and ack that
 // were captured during the run.
 TYPED_TEST(SlaveRecoveryTest, RecoverSlaveState)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   FrameworkID frameworkId;
   EXPECT_CALL(sched, registered(_, _, _))
     .WillOnce(SaveArg<1>(&frameworkId));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   Future<Message> registerFrameworkMessage =
     FUTURE_MESSAGE(Eq(RegisterFrameworkMessage().GetTypeName()), _, _);

   driver.start();

   // Capture the framework pid.
   AWAIT_READY(registerFrameworkMessage);
   UPID frameworkPid = registerFrameworkMessage.get().from;

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   SlaveID slaveId = offers.get()[0].slave_id();

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // Scheduler expectations.
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillRepeatedly(Return());

   // Message expectations. These must be set up before the task is
   // launched so that none of the messages are missed.
   Future<Message> registerExecutorMessage =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   Future<StatusUpdateMessage> update =
     FUTURE_PROTOBUF(StatusUpdateMessage(), Eq(master.get()), _);

   Future<StatusUpdateAcknowledgementMessage> ack =
     FUTURE_PROTOBUF(StatusUpdateAcknowledgementMessage(), _, _);

   Future<Nothing> _ack =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Capture the executor pids.
   AWAIT_READY(registerExecutorMessage);
   RegisterExecutorMessage registerExecutor;
   ASSERT_TRUE(
       registerExecutor.ParseFromString(registerExecutorMessage.get().body));
   ExecutorID executorId = registerExecutor.executor_id();
   UPID libprocessPid = registerExecutorMessage.get().from;

   // Capture the update.
   AWAIT_READY(update);
   EXPECT_EQ(TASK_RUNNING, update.get().update().status().state());

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_ack);

   // Recover the state.
   Result<state::SlaveState> recover = state::recover(
       paths::getMetaRootDir(flags.work_dir), true);

   ASSERT_SOME(recover);

   state::SlaveState state = recover.get();

   // Check slave id.
   ASSERT_EQ(slaveId, state.id);

   // Check framework id and pid.
   ASSERT_TRUE(state.frameworks.contains(frameworkId));
   ASSERT_SOME_EQ(frameworkPid, state.frameworks[frameworkId].pid);

   ASSERT_TRUE(state.frameworks[frameworkId].executors.contains(executorId));

   // Check executor id and pids.
   const Option<UUID>& uuid =
       state.frameworks[frameworkId].executors[executorId].latest;
   ASSERT_SOME(uuid);

   ASSERT_TRUE(state
                 .frameworks[frameworkId]
                 .executors[executorId]
                 .runs.contains(uuid.get()));

   ASSERT_SOME_EQ(
       libprocessPid,
       state
         .frameworks[frameworkId]
         .executors[executorId]
         .runs[uuid.get()]
         .libprocessPid);

   // Check task id and info.
   ASSERT_TRUE(state
                 .frameworks[frameworkId]
                 .executors[executorId]
                 .runs[uuid.get()]
                 .tasks.contains(task.task_id()));

   // The checkpointed task info is compared against a task in the
   // TASK_STAGING state.
   const Task& t = mesos::internal::protobuf::createTask(
       task, TASK_STAGING, executorId, frameworkId);

   ASSERT_SOME_EQ(
       t,
       state
         .frameworks[frameworkId]
         .executors[executorId]
         .runs[uuid.get()]
         .tasks[task.task_id()]
         .info);

   // Check status update and ack.
   ASSERT_EQ(
       1U,
       state
         .frameworks[frameworkId]
         .executors[executorId]
         .runs[uuid.get()]
         .tasks[task.task_id()]
         .updates.size());

   ASSERT_EQ(
       update.get().update().uuid(),
       state
         .frameworks[frameworkId]
         .executors[executorId]
         .runs[uuid.get()]
         .tasks[task.task_id()]
         .updates.front().uuid());

   ASSERT_TRUE(state
                 .frameworks[frameworkId]
                 .executors[executorId]
                 .runs[uuid.get()]
                 .tasks[task.task_id()]
                 .acks.contains(UUID::fromBytes(ack.get().uuid())));

   // Shut down the executor manually so that it doesn't hang around
   // after the test finishes.
   process::post(libprocessPid, ShutdownExecutorMessage());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is killed before the update reaches the scheduler.
 // When the slave comes back up it resends the unacknowledged update.
 //
 // The first status update message is dropped, the slave is stopped
 // and then restarted with the same flags; the scheduler is expected
 // to receive TASK_RUNNING afterwards.
 TYPED_TEST(SlaveRecoveryTest, RecoverStatusUpdateManager)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // Message expectations.
   Future<Message> registerExecutor =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   // Drop the first update from the executor.
   Future<StatusUpdateMessage> update =
     DROP_PROTOBUF(StatusUpdateMessage(), _, _);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Capture the executor pid.
   AWAIT_READY(registerExecutor);
   UPID executorPid = registerExecutor.get().from;

   // Wait for the status update drop.
   AWAIT_READY(update);

   this->Stop(slave.get());

   // Set up the scheduler expectation before the slave is restarted.
   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());       // Ignore subsequent updates.

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   AWAIT_READY(status);
   ASSERT_EQ(TASK_RUNNING, status.get().state());

   // Shut down the executor manually so that it doesn't hang around
   // after the test finishes.
   // TODO(vinod): Kill this after the fix to 'Cluster' to properly
   // shutdown the slaves.
   process::post(executorPid, ShutdownExecutorMessage());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped before the first update for a task is received
 // from the executor. When it comes back up with recovery=reconnect, make
 // sure the executor re-registers and the slave properly sends the update.
 //
 // The re-registration message is expected to carry exactly one
 // update: TASK_RUNNING for the launched task.
 TYPED_TEST(SlaveRecoveryTest, ReconnectExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // Drop the first update from the executor.
   Future<StatusUpdateMessage> statusUpdate =
     DROP_PROTOBUF(StatusUpdateMessage(), _, _);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Stop the slave before the status update is received.
   AWAIT_READY(statusUpdate);

   this->Stop(slave.get());

   // Both expectations are set up before the slave is restarted.
   Future<Message> reregisterExecutorMessage =
     FUTURE_MESSAGE(Eq(ReregisterExecutorMessage().GetTypeName()), _, _);

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());       // Ignore subsequent updates.

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // Ensure the executor re-registers.
   AWAIT_READY(reregisterExecutorMessage);
   UPID executorPid = reregisterExecutorMessage.get().from;

   ReregisterExecutorMessage reregister;
   ASSERT_TRUE(
       reregister.ParseFromString(reregisterExecutorMessage.get().body));

   // Executor should inform about the unacknowledged update.
   ASSERT_EQ(1, reregister.updates_size());
   const StatusUpdate& update = reregister.updates(0);
   ASSERT_EQ(task.task_id(), update.status().task_id());
   ASSERT_EQ(TASK_RUNNING, update.status().state());

   // Scheduler should receive the recovered update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_RUNNING, status.get().state());

   // Shut down the executor manually so that it doesn't hang around
   // after the test finishes.
   // TODO(vinod): Kill this after the fix to 'Cluster' to properly
   // shutdown the slaves.
   process::post(executorPid, ShutdownExecutorMessage());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped before the (command) executor is registered.
 // When it comes back up with recovery=reconnect, make sure the
 // executor is killed and the task is transitioned to FAILED.
 //
 // The executor's registration message is dropped, so the restarted
 // slave never hears from it; the test drives the paused clock past
 // EXECUTOR_REREGISTER_TIMEOUT and then forward until the status
 // update arrives.
 TYPED_TEST(SlaveRecoveryTest, RecoverUnregisteredExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // Drop the executor registration message.
   Future<Message> registerExecutor =
     DROP_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Stop the slave before the executor is registered.
   AWAIT_READY(registerExecutor);

   this->Stop(slave.get());

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());       // Ignore subsequent updates.

   Future<Nothing> recover = FUTURE_DISPATCH(_, &Slave::_recover);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Now advance time until the reaper reaps the executor.
   while (status.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   // Scheduler should receive the TASK_FAILED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_FAILED, status.get().state());

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped after a non-terminal update is received.
 // The command executor terminates when the slave is down.
 // When it comes back up with recovery=reconnect, make
 // sure the task is properly transitioned to FAILED.
 //
 // The executor is sent a ShutdownExecutorMessage while the slave is
 // stopped; after the restart the test drives the paused clock past
 // EXECUTOR_REREGISTER_TIMEOUT and then forward until the status
 // update arrives.
 TYPED_TEST(SlaveRecoveryTest, RecoverTerminatedExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   Future<Message> registerExecutor =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   // The first status update delivered to the scheduler.
   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> ack =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Capture the executor pid.
   AWAIT_READY(registerExecutor);
   UPID executorPid = registerExecutor.get().from;

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(ack);

   this->Stop(slave.get());

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status));

   // Now shut down the executor, when the slave is down.
   process::post(executorPid, ShutdownExecutorMessage());

   Future<Nothing> recover = FUTURE_DISPATCH(_, &Slave::_recover);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Now advance time until the reaper reaps the executor.
   while (status.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   // Scheduler should receive the TASK_FAILED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_FAILED, status.get().state());

   // Undo the Clock::pause() above so the clock is not left paused
   // once this test returns.
   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped after a non-terminal update is received.
 // The command executor is expected to self-terminate while the slave
 // is down, because the recovery timeout elapses.
 // When the slave comes back up with recovery=reconnect, make
 // sure the task is properly transitioned to FAILED.
 TYPED_TEST(SlaveRecoveryTest, RecoveryTimeout)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   // Set a short recovery timeout, as we can't control the executor
   // driver time when using the process / cgroups isolators.
   slave::Flags flags = this->CreateSlaveFlags();
   flags.recovery_timeout = Milliseconds(1);

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // The first status update delivered to the scheduler.
   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement);

   this->Stop(slave.get());

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status));

   // Ensure the executor terminates by causing the recovery timeout
   // to elapse while disconnected from the slave.
   os::sleep(Milliseconds(1));

   Future<Nothing> _recover = FUTURE_DISPATCH(_, &Slave::_recover);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(_recover);

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);
   Clock::settle();

   // The clock is resumed before waiting for the final update.
   Clock::resume();

   // Scheduler should receive the TASK_FAILED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_FAILED, status.get().state());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped after an executor is completed (i.e., it has
 // terminated and all its updates have been acknowledged).
 // When it comes back up with recovery=reconnect, make
 // sure the recovery successfully completes.
 //
 // A dispatch to GarbageCollectorProcess::schedule is used as the
 // signal that the executor has been cleaned up, both before the
 // slave is stopped and after it is restarted.
 TYPED_TEST(SlaveRecoveryTest, RecoverCompletedExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "exit 0");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Short-lived task.

   EXPECT_CALL(sched, statusUpdate(_, _))
     .Times(2); // TASK_RUNNING and TASK_FINISHED updates.

   EXPECT_CALL(sched, offerRescinded(_, _))
     .Times(AtMost(1));

   Future<Nothing> schedule = FUTURE_DISPATCH(
       _, &GarbageCollectorProcess::schedule);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // We use 'gc.schedule' as a proxy for the cleanup of the executor.
   AWAIT_READY(schedule);

   this->Stop(slave.get());

   Future<Nothing> schedule2 = FUTURE_DISPATCH(
       _, &GarbageCollectorProcess::schedule);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // We use 'gc.schedule' as a proxy for the cleanup of the executor.
   AWAIT_READY(schedule2);

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is stopped after a non-terminal update is received.
 // Slave is restarted in recovery=cleanup mode. It kills the command
 // executor, and transitions the task to FAILED.
 TYPED_TEST(SlaveRecoveryTest, CleanupExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers));

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   // The first status update delivered to the scheduler.
   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> ack =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(ack);

   this->Stop(slave.get());

   // Slave in cleanup mode shouldn't reregister with the master and
   // hence no offers should be made by the master.
   EXPECT_CALL(sched, resourceOffers(_, _))
     .Times(0);

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status));

   Future<Nothing> _initialize = FUTURE_DISPATCH(_, &Slave::_initialize);

   // Restart the slave in 'cleanup' recovery mode with a new isolator.
   TypeParam isolator2;

   flags.recover = "cleanup";

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   // Now advance time until the reaper reaps the executor.
   while (status.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   // Scheduler should receive the TASK_FAILED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_FAILED, status.get().state());

   // Wait for recovery to complete.
   AWAIT_READY(_initialize);
   Clock::settle();

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test checks whether a non-checkpointing framework is
 // properly removed, when a checkpointing slave is disconnected.
 //
 // Two long-running tasks are launched from a single offer; after the
 // slave is stopped the scheduler is expected to receive a TASK_LOST
 // update for each of them.
 TYPED_TEST(SlaveRecoveryTest, RemoveNonCheckpointingFramework)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator;

   Try<PID<Slave> > slave = this->StartSlave(&isolator);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Disable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(false);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   // Launch 2 tasks from this offer.
   vector<TaskInfo> tasks;
   Offer offer = offers.get()[0];

   // Each task is created from a copy of the offer whose resources
   // are replaced by a fixed "cpus:1;mem:512" share.
   Offer offer1 = offer;
   offer1.mutable_resources()->CopyFrom(
       Resources::parse("cpus:1;mem:512").get());
   tasks.push_back(createTask(offer1, "sleep 1000")); // Long-running task

   Offer offer2 = offer;
   offer2.mutable_resources()->CopyFrom(
       Resources::parse("cpus:1;mem:512").get());
   tasks.push_back(createTask(offer2, "sleep 1000")); // Long-running task

   // Both shares together must fit into the original offer.
   ASSERT_LE(Resources(offer1.resources()) + Resources(offer2.resources()),
             Resources(offer.resources()));

   Future<Nothing> update1;
   Future<Nothing> update2;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureSatisfy(&update1))
     .WillOnce(FutureSatisfy(&update2));

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for TASK_RUNNING updates from the tasks.
   AWAIT_READY(update1);
   AWAIT_READY(update2);

   // The master should generate TASK_LOST updates once the slave is stopped.
   Future<TaskStatus> status1;
   Future<TaskStatus> status2;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status1))
     .WillOnce(FutureArg<1>(&status2));

   this->Stop(slave.get());

   // Scheduler should receive the TASK_LOST updates.
   AWAIT_READY(status1);
   ASSERT_EQ(TASK_LOST, status1.get().state());

   AWAIT_READY(status2);
   ASSERT_EQ(TASK_LOST, status2.get().state());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test ensures that no checkpointing happens for a
 // framework that has disabled checkpointing.
 //
 // After the task is running, an 'updateFramework' call is dispatched
 // to the slave and the test asserts that the framework's path under
 // the meta root directory does not exist.
 TYPED_TEST(SlaveRecoveryTest, NonCheckpointingFramework)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Disable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(false);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   FrameworkID frameworkId;
   EXPECT_CALL(sched, registered(_, _, _))
     .WillOnce(SaveArg<1>(&frameworkId));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());      // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // This has to be fatal: the first offer is indexed right below.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   Future<Nothing> update;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureSatisfy(&update))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for TASK_RUNNING update.
   AWAIT_READY(update);

   Clock::pause();

   Future<Nothing> updateFramework =
     FUTURE_DISPATCH(_, &Slave::updateFramework);

   // Simulate a 'UpdateFrameworkMessage' to ensure framework pid is
   // not being checkpointed.
   process::dispatch(slave.get(), &Slave::updateFramework, frameworkId, "");

   AWAIT_READY(updateFramework);

   Clock::settle(); // Wait for the slave to act on the dispatch.

   // Ensure that the framework info is not being checkpointed.
   const string& path = paths::getFrameworkPath(
       paths::getMetaRootDir(flags.work_dir),
       task.slave_id(),
       frameworkId);

   ASSERT_FALSE(os::exists(path));

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test ensures that a non-checkpointing slave's resources are not offered
 // to a framework that requires checkpointing.
 //
 // The clock is paused for the whole scenario so that, once the
 // scheduler has registered, a Clock::settle() is enough to conclude
 // that no offer was delivered.
 TYPED_TEST(SlaveRecoveryTest, NonCheckpointingSlave)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator;

   // Disable checkpointing for the slave.
   slave::Flags flags = this->CreateSlaveFlags();
   flags.checkpoint = false;

   Clock::pause();

   Future<RegisterSlaveMessage> registerSlaveMessage =
     FUTURE_PROTOBUF(RegisterSlaveMessage(), _, _);

   Try<PID<Slave> > slave = this->StartSlave(&isolator, flags);
   ASSERT_SOME(slave);

   AWAIT_READY(registerSlaveMessage);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   Future<Nothing> registered;
   EXPECT_CALL(sched, registered(_, _, _))
     .WillOnce(FutureSatisfy(&registered));

   EXPECT_CALL(sched, resourceOffers(_, _))
     .Times(0); // No offers should be received!

   driver.start();

   // Wait for scheduler to register. We do a Clock::settle() here
   // to ensure that no offers are received by the scheduler.
   AWAIT_READY(registered);
   Clock::settle();

   // Undo the Clock::pause() above so the clock is not left paused
   // once this test returns.
   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // Scheduler asks a restarted slave to kill a task that has been
 // running before the slave restarted. This test ensures that a
 // restarted slave is able to communicate with all components
 // (scheduler, master, executor).
 //
 // Flow: launch a long-running task, wait for the status update
 // acknowledgement dispatch, stop and restart the slave with the same
 // flags, wait for it to re-register, kill the task, and finally
 // verify that the resources offered afterwards equal the resources
 // that were offered originally.
 TYPED_TEST(SlaveRecoveryTest, KillTask)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers1));

   driver.start();

   AWAIT_READY(offers1);

   // Fatal check: offers1.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers1.get().size());

   TaskInfo task = createTask(offers1.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> ack =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers1.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(ack);

   this->Stop(slave.get());

   // These futures must be created before the slave is restarted so
   // that the corresponding dispatch/message is not missed.
   Future<Nothing> recover = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlave =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Wait for the slave to re-register.
   AWAIT_READY(reregisterSlave);

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers2))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   // Kill the task.
   driver.killTask(task.task_id());

   // Wait for TASK_KILLED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_KILLED, status.get().state());

   // Advance the clock until the allocator allocates
   // the recovered resources.
   while (offers2.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   // Make sure all slave resources are reoffered.
   AWAIT_READY(offers2);

   // Guard the offers2.get()[0] access below against an empty list.
   ASSERT_NE(0u, offers2.get().size());
   ASSERT_EQ(Resources(offers1.get()[0].resources()),
             Resources(offers2.get()[0].resources()));

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // When the slave is down we remove the "latest" symlink in the
 // executor's run directory, to simulate a situation where the
 // recovered slave (--no-strict) cannot recover the executor and
 // hence schedules it for gc.
 //
 // After the slave re-registers, the clock is advanced by
 // flags.gc_delay and the test asserts that neither the executor's
 // work directory nor its meta directory exists any more.
 TYPED_TEST(SlaveRecoveryTest, GCExecutor)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();
   flags.strict = false;

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return()); // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // Fatal check: offers.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   // Capture the slave and framework ids.
   SlaveID slaveId = offers.get()[0].slave_id();
   FrameworkID frameworkId = offers.get()[0].framework_id();

   Future<Message> registerExecutorMessage =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   Future<Nothing> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureSatisfy(&status))
     .WillRepeatedly(Return()); // Ignore subsequent updates.

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Capture the executor id and pid. The executor id is used to
   // build the paths checked below, so a message body that fails to
   // parse must fail the test instead of yielding an empty id.
   AWAIT_READY(registerExecutorMessage);
   RegisterExecutorMessage registerExecutor;
   ASSERT_TRUE(
       registerExecutor.ParseFromString(registerExecutorMessage.get().body));
   ExecutorID executorId = registerExecutor.executor_id();
   UPID executorPid = registerExecutorMessage.get().from;

   // Wait for TASK_RUNNING update.
   AWAIT_READY(status);

   this->Stop(slave.get());

   // Shut down the executor manually so that it doesn't hang around
   // after the test finishes.
   process::post(executorPid, ShutdownExecutorMessage());

   // Remove the symlink "latest" in the executor directory
   // to simulate a non-recoverable executor.
   ASSERT_SOME(os::rm(paths::getExecutorLatestRunPath(
       paths::getMetaRootDir(flags.work_dir),
       slaveId,
       frameworkId,
       executorId)));

   // These futures must be created before the slave is restarted so
   // that the corresponding dispatch/message is not missed.
   Future<Nothing> recover = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlave =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   Clock::settle();

   AWAIT_READY(reregisterSlave);

   // Let the gc delay elapse and give the slave a chance to act on it.
   Clock::advance(flags.gc_delay);

   Clock::settle();

   // Executor's work and meta directories should be gc'ed by now.
   ASSERT_FALSE(os::exists(paths::getExecutorPath(
       flags.work_dir, slaveId, frameworkId, executorId)));

   ASSERT_FALSE(os::exists(paths::getExecutorPath(
       paths::getMetaRootDir(flags.work_dir),
       slaveId,
       frameworkId,
       executorId)));

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The slave is asked to shutdown. When it comes back up, it should
 // register as a new slave.
 //
 // The check is done by comparing the slave id carried by the first
 // offer (before the shutdown) with the slave id carried by the first
 // offer received after the slave has been restarted.
 TYPED_TEST(SlaveRecoveryTest, ShutdownSlave)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers1))
     .WillOnce(Return());       // Ignore the offer when slave is shutting down.

   driver.start();

   AWAIT_READY(offers1);

   // Fatal check: offers1.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers1.get().size());

   TaskInfo task = createTask(offers1.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task.

   Future<Nothing> statusUpdate1;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureSatisfy(&statusUpdate1))
     .WillOnce(Return());  // Ignore TASK_FAILED update.

   Future<Message> registerExecutor =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   driver.launchTasks(offers1.get()[0].id(), tasks);

   // Capture the executor pid.
   AWAIT_READY(registerExecutor);
   UPID executorPid = registerExecutor.get().from;

   AWAIT_READY(statusUpdate1); // Wait for TASK_RUNNING update.

   EXPECT_CALL(sched, offerRescinded(_, _))
     .Times(AtMost(1));

   Future<Nothing> executorTerminated =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   // We shut down the executor here so that a shutting down slave
   // does not spend too much time waiting for the executor to exit.
   process::post(executorPid, ShutdownExecutorMessage());

   Clock::pause();

   // Now advance time until the reaper reaps the executor.
   while (executorTerminated.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   AWAIT_READY(executorTerminated);

   Clock::resume();

   this->Stop(slave.get(), true); // Send a "shut down".

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers2))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   // Now restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // Ensure that the slave registered with a new id.
   AWAIT_READY(offers2);

   // Fatal check: offers2.get()[0] is dereferenced below.
   ASSERT_NE(0u, offers2.get().size());

   // Ensure the slave id is different.
   ASSERT_NE(
       offers1.get()[0].slave_id().value(), offers2.get()[0].slave_id().value());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The checkpointing slave fails to do recovery and tries to register
 // as a new slave. The master should give it a new id and transition
 // all the tasks of the old slave to LOST.
 //
 // The failed recovery is simulated by stopping the slave and then
 // re-posting its original RegisterSlaveMessage to the master from the
 // stopped slave's pid.
 TYPED_TEST(SlaveRecoveryTest, RegisterDisconnectedSlave)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   // Captured so that the same registration can be replayed later.
   Future<RegisterSlaveMessage> registerSlaveMessage =
     FUTURE_PROTOBUF(RegisterSlaveMessage(), _, _);

   TypeParam isolator;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator, flags);
   ASSERT_SOME(slave);

   AWAIT_READY(registerSlaveMessage);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return()); // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // Fatal check: offers.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   Future<Message> registerExecutorMessage =
     FUTURE_MESSAGE(Eq(RegisterExecutorMessage().GetTypeName()), _, _);

   Future<Nothing> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureSatisfy(&status));

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Capture the executor pid from the sender of the registration
   // message; the message body itself is not needed by this test.
   AWAIT_READY(registerExecutorMessage);
   UPID executorPid = registerExecutorMessage.get().from;

   // Wait for TASK_RUNNING update.
   AWAIT_READY(status);

   EXPECT_CALL(sched, slaveLost(_, _))
     .Times(AtMost(1));

   this->Stop(slave.get());

   // Shut down the executor manually so that it doesn't hang around
   // after the test finishes.
   process::post(executorPid, ShutdownExecutorMessage());

   Future<TaskStatus> status2;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status2));

   // Spoof the registration attempt of a checkpointing slave
   // that failed recovery. We do this because simply restarting
   // the slave will result in a slave with a different pid than
   // the previous one.
   post(slave.get(), master.get(), registerSlaveMessage.get());

   // Scheduler should get a TASK_LOST message.
   AWAIT_READY(status2);
   ASSERT_EQ(TASK_LOST, status2.get().state());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test verifies that a KillTask message received by the
 // master when a checkpointing slave is disconnected is properly
 // reconciled when the slave reregisters.
 //
 // The kill is issued while the slave is stopped; the test then
 // restarts the slave and expects the scheduler to receive a
 // TASK_KILLED status update.
 TYPED_TEST(SlaveRecoveryTest, ReconcileKillTask)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   Future<RegisterSlaveMessage> registerSlaveMessage =
     FUTURE_PROTOBUF(RegisterSlaveMessage(), _, _);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   AWAIT_READY(registerSlaveMessage);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return()); // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // Fatal check: offers.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers.get().size());

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   EXPECT_CALL(sched, statusUpdate(_, _)); // TASK_RUNNING

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for TASK_RUNNING update to be acknowledged.
   AWAIT_READY(_statusUpdateAcknowledgement);

   this->Stop(slave.get());

   // Now send a KillTask message to the master. This will not be
   // received by the slave because it is down.
   driver.killTask(task.task_id());

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status));

   // Now restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // Scheduler should get a TASK_KILLED message.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_KILLED, status.get().state());

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test verifies that when the slave recovers and re-registers
 // with a framework that was shutdown when the slave was down, it gets
 // a ShutdownFramework message.
 //
 // The scheduler driver is stopped while the slave is down; after the
 // slave restarts the test waits for a ShutdownFrameworkMessage and
 // for the Slave::executorTerminated dispatch.
 TYPED_TEST(SlaveRecoveryTest, ReconcileShutdownFramework)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   Future<RegisterSlaveMessage> registerSlaveMessage =
     FUTURE_PROTOBUF(RegisterSlaveMessage(), _, _);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   AWAIT_READY(registerSlaveMessage);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return()); // Ignore subsequent offers.

   driver.start();

   AWAIT_READY(offers);

   // Fatal check: offers.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers.get().size());

   EXPECT_CALL(sched, statusUpdate(_, _)); // TASK_RUNNING

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for TASK_RUNNING update to be acknowledged.
   AWAIT_READY(_statusUpdateAcknowledgement);

   this->Stop(slave.get());

   Future<UnregisterFrameworkMessage> unregisterFrameworkMessage =
     FUTURE_PROTOBUF(UnregisterFrameworkMessage(), _, _);

   // Now stop the framework.
   driver.stop();
   driver.join();

   // Wait until the framework is removed.
   AWAIT_READY(unregisterFrameworkMessage);

   // These futures must be created before the slave is restarted so
   // that the corresponding message/dispatch is not missed.
   Future<ShutdownFrameworkMessage> shutdownFrameworkMessage =
     FUTURE_PROTOBUF(ShutdownFrameworkMessage(), _, _);

   Future<Nothing> executorTerminated =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   // Now restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // Slave should get a ShutdownFrameworkMessage.
   AWAIT_READY(shutdownFrameworkMessage);

   // Ensure that the executor is terminated.
   AWAIT_READY(executorTerminated);

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }

 // Scheduler asks a restarted slave to kill a task that has been
 // running before the slave restarted. A scheduler failover happens
 // when the slave is down. This test verifies that a scheduler
 // failover will not affect the slave recovery process.
 //
 // Two drivers are used: driver1 launches the task, and driver2 is
 // started with the framework id recorded from driver1 while the
 // slave is stopped. After the slave re-registers, the task is killed
 // through driver2 and the re-offered resources are compared with the
 // resources from the original offer.
 TYPED_TEST(SlaveRecoveryTest, SchedulerFailover)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;
   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   // Launch the first (i.e., failing) scheduler.
   MockScheduler sched1;

   FrameworkInfo framework1;
   framework1.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   framework1.set_checkpoint(true);

   MesosSchedulerDriver driver1(&sched1, framework1, master.get());

   Future<FrameworkID> frameworkId;
   EXPECT_CALL(sched1, registered(&driver1, _, _))
     .WillOnce(FutureArg<1>(&frameworkId));

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched1, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers1));

   driver1.start();

   AWAIT_READY(frameworkId);
   AWAIT_READY(offers1);

   // Fatal check: offers1.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers1.get().size());

   // Create a long running task.
   TaskInfo task = createTask(offers1.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task);

   EXPECT_CALL(sched1, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver1.launchTasks(offers1.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement);

   this->Stop(slave.get());

   // Now launch the second (i.e., failover) scheduler using the
   // framework id recorded from the first scheduler.
   MockScheduler sched2;

   FrameworkInfo framework2;
   framework2.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   framework2.mutable_id()->MergeFrom(frameworkId.get());
   framework2.set_checkpoint(true);

   MesosSchedulerDriver driver2(&sched2, framework2, master.get());

   Future<Nothing> sched2Registered;
   EXPECT_CALL(sched2, registered(&driver2, frameworkId.get(), _))
     .WillOnce(FutureSatisfy(&sched2Registered));

   // The first scheduler is expected to be told about the failover.
   Future<Nothing> sched1Error;
   EXPECT_CALL(sched1, error(&driver1, "Framework failed over"))
     .WillOnce(FutureSatisfy(&sched1Error));

   driver2.start();

   AWAIT_READY(sched2Registered);
   AWAIT_READY(sched1Error);

   // These futures must be created before the slave is restarted so
   // that the corresponding dispatch/message is not missed.
   Future<Nothing> _recover = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlaveMessage =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(_recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Wait for the slave to re-register.
   AWAIT_READY(reregisterSlaveMessage);

   Future<TaskStatus> status;
   EXPECT_CALL(sched2, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched2, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers2))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   // Kill the task.
   driver2.killTask(task.task_id());

   // Wait for TASK_KILLED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_KILLED, status.get().state());

   // Advance the clock until the allocator allocates
   // the recovered resources.
   while (offers2.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   // Make sure all slave resources are reoffered.
   AWAIT_READY(offers2);

   // Guard the offers2.get()[0] access below against an empty list.
   ASSERT_NE(0u, offers2.get().size());
   ASSERT_EQ(Resources(offers1.get()[0].resources()),
             Resources(offers2.get()[0].resources()));

   Clock::resume();

   driver2.stop();
   driver2.join();

   driver1.stop();
   driver1.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // The purpose of this test is to ensure that during a network
 // partition, the master will remove a partitioned slave. When the
 // partition is removed, the slave will receive a ShutdownMessage.
 // When the slave starts again on the same host, we verify that the
 // slave will not try to reregister itself with the master. It will
 // register itself with the master and get a new slave id.
 //
 // NOTE(review): the body only waits for a RegisterSlaveMessage after
 // the restart; it does not compare slave ids explicitly.
 TYPED_TEST(SlaveRecoveryTest, PartitionedSlave)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   // Set these expectations up before we spawn the slave so that we
   // don't miss the first PING.
   Future<Message> ping = FUTURE_MESSAGE(Eq("PING"), _, _);

   // Drop all the PONGs to simulate slave partition.
   DROP_MESSAGES(Eq("PONG"), _, _);

   TypeParam isolator1;
   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MockScheduler sched;
   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers;
   EXPECT_CALL(sched, resourceOffers(&driver, _))
     .WillOnce(FutureArg<1>(&offers))
     .WillRepeatedly(Return());

   driver.start();

   AWAIT_READY(offers);
   ASSERT_NE(0u, offers.get().size());

   // Long running task.
   TaskInfo task = createTask(offers.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task);

   // First status update for the launched task (presumably
   // TASK_RUNNING; the state is not inspected here).
   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement);

   // Everything the partition is expected to trigger is registered
   // up front, before the clock is manipulated: the shutdown message
   // for the slave, the slaveLost callback, the next status update and
   // the executor termination dispatch.
   // NOTE(review): the third FUTURE_PROTOBUF argument looks like a
   // filter on the recipient pid -- confirm against the macro.
   Future<ShutdownMessage> shutdownMessage =
     FUTURE_PROTOBUF(ShutdownMessage(), _, slave.get());

   Future<Nothing> slaveLost;
   EXPECT_CALL(sched, slaveLost(&driver, _))
     .WillOnce(FutureSatisfy(&slaveLost));

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(&driver, _))
     .WillOnce(FutureArg<1>(&status));

   Future<Nothing> executorTerminated =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   Clock::pause();

   // Now, induce a partition of the slave by having the master
   // timeout the slave.
   //
   // Each iteration waits for one PING; until MAX_SLAVE_PING_TIMEOUTS
   // pings have been seen, a fresh PING future is installed and the
   // clock is advanced by SLAVE_PING_TIMEOUT to provoke the next one.
   uint32_t pings = 0;
   while (true) {
     AWAIT_READY(ping);
     pings++;
     if (pings == master::MAX_SLAVE_PING_TIMEOUTS) {
      break;
     }
     ping = FUTURE_MESSAGE(Eq("PING"), _, _);
     Clock::advance(master::SLAVE_PING_TIMEOUT);
     Clock::settle();
   }

   // One more timeout interval after the last observed PING.
   Clock::advance(master::SLAVE_PING_TIMEOUT);
   Clock::settle();

   // The master will notify the framework that the slave was lost.
   AWAIT_READY(slaveLost);

   // The master will have notified the framework of the lost task.
   AWAIT_READY(status);
   EXPECT_EQ(TASK_LOST, status.get().state());

   // Wait for the master to attempt to shut down the slave.
   AWAIT_READY(shutdownMessage);

   // Wait for the executor to be terminated.
   // The clock is still paused, so it is advanced one second at a
   // time until the executorTerminated dispatch is observed.
   while (executorTerminated.isPending()) {
     Clock::advance(Seconds(1));
     Clock::settle();
   }

   AWAIT_READY(executorTerminated);
   Clock::settle();

   this->Stop(slave.get());

   // Installed before the restart so the registration is not missed.
   Future<RegisterSlaveMessage> registerSlaveMessage =
     FUTURE_PROTOBUF(RegisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   // A RegisterSlaveMessage (as opposed to a ReregisterSlaveMessage)
   // is what this test waits for after the restart.
   AWAIT_READY(registerSlaveMessage);

   Clock::resume();

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // This test verifies that if the master changes when the slave is
 // down, the slave can still recover the task when it restarts. We
 // verify its correctness by killing the task from the scheduler.
 //
 // The master failover is simulated by stopping and restarting the
 // master and then posting a NewMasterDetectedMessage to the pid that
 // received the original FrameworkRegisteredMessage.
 TYPED_TEST(SlaveRecoveryTest, MasterFailover)
 {
   // Step 1. Run a task.
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   MockScheduler sched;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers1));

   // Captured so that the recipient pid of this message can be used
   // as the target of the NewMasterDetectedMessage posted in step 2.
   Future<process::Message> frameworkRegisteredMessage =
     FUTURE_MESSAGE(Eq(FrameworkRegisteredMessage().GetTypeName()), _, _);

   driver.start();

   AWAIT_READY(frameworkRegisteredMessage);
   AWAIT_READY(offers1);

   // Fatal check: offers1.get()[0] is dereferenced below, so the test
   // must not continue with an empty offer list.
   ASSERT_NE(0u, offers1.get().size());

   TaskInfo task = createTask(offers1.get()[0], "sleep 1000");
   vector<TaskInfo> tasks;
   tasks.push_back(task); // Long-running task

   EXPECT_CALL(sched, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers1.get()[0].id(), tasks);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement);

   this->Stop(slave.get());

   // Step 2. Simulate failed over master by restarting the master.
   this->Stop(master.get());
   master = this->StartMaster();
   ASSERT_SOME(master);

   Future<Nothing> registered;
   EXPECT_CALL(sched, registered(&driver, _, _))
     .WillOnce(FutureSatisfy(&registered));

   // Simulate a new master detected message to the scheduler.
   NewMasterDetectedMessage newMasterDetectedMsg;
   newMasterDetectedMsg.set_pid(master.get());

   process::post(frameworkRegisteredMessage.get().to, newMasterDetectedMsg);

   // Framework should get a registered callback.
   AWAIT_READY(registered);

   // Step 3. Restart the slave and kill the task.
   Future<Nothing> _recover = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlaveMessage =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(_recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Wait for the slave to re-register.
   AWAIT_READY(reregisterSlaveMessage);

   Clock::resume();

   Future<TaskStatus> status;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers2))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   // Wait for the executor to terminate before shutting down the
   // slave in order to give cgroups (if applicable) time to clean up.
   Future<Nothing> executorTerminated =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   // Kill the task.
   driver.killTask(task.task_id());

   // Wait for TASK_KILLED update.
   AWAIT_READY(status);
   ASSERT_EQ(TASK_KILLED, status.get().state());

   // Make sure all slave resources are reoffered.
   AWAIT_READY(offers2);

   // Guard the offers2.get()[0] access below against an empty list.
   ASSERT_NE(0u, offers2.get().size());
   ASSERT_EQ(Resources(offers1.get()[0].resources()),
             Resources(offers2.get()[0].resources()));

   AWAIT_READY(executorTerminated);

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // In this test there are two frameworks and one slave. Each
 // framework launches a task before the slave goes down. We verify
 // that the two frameworks and their tasks are recovered after the
 // slave restarts: once the restarted slave has re-registered, each
 // framework kills its own task and must receive TASK_KILLED for it.
 TYPED_TEST(SlaveRecoveryTest, MultipleFrameworks)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   TypeParam isolator1;

   slave::Flags flags = this->CreateSlaveFlags();

   Try<PID<Slave> > slave = this->StartSlave(&isolator1, flags);
   ASSERT_SOME(slave);

   // Framework 1.
   MockScheduler sched1;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo1;
   frameworkInfo1.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo1.set_checkpoint(true);

   MesosSchedulerDriver driver1(&sched1, frameworkInfo1, master.get());

   EXPECT_CALL(sched1, registered(_, _, _));

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched1, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers1))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   driver1.start();

   // Abort (rather than merely record a failure) if no offer arrived,
   // because the first offer is indexed right below.
   AWAIT_READY(offers1);
   ASSERT_NE(0u, offers1.get().size());

   // Use part of the resources in the offer so that the rest can be
   // offered to framework 2.
   Offer offer1 = offers1.get()[0];
   offer1.mutable_resources()->CopyFrom(
       Resources::parse("cpus:1;mem:512").get());

   // Framework 1 launches a task.
   TaskInfo task1 = createTask(offer1, "sleep 1000");
   vector<TaskInfo> tasks1;
   tasks1.push_back(task1); // Long-running task

   EXPECT_CALL(sched1, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement1 =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);

   driver1.launchTasks(offer1.id(), tasks1);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement1);

   // Framework 2.
   MockScheduler sched2;

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo2;
   frameworkInfo2.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo2.set_checkpoint(true);

   MesosSchedulerDriver driver2(&sched2, frameworkInfo2, master.get());

   EXPECT_CALL(sched2, registered(_, _, _));

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched2, resourceOffers(_, _))
     .WillOnce(FutureArg<1>(&offers2))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   driver2.start();

   // As above: the first offer is indexed below, so its absence must
   // stop the test.
   AWAIT_READY(offers2);
   ASSERT_NE(0u, offers2.get().size());

   // Framework 2 launches a task.
   TaskInfo task2 = createTask(offers2.get()[0], "sleep 1000");

   vector<TaskInfo> tasks2;
   tasks2.push_back(task2); // Long-running task

   EXPECT_CALL(sched2, statusUpdate(_, _));

   Future<Nothing> _statusUpdateAcknowledgement2 =
     FUTURE_DISPATCH(_, &Slave::_statusUpdateAcknowledgement);
   driver2.launchTasks(offers2.get()[0].id(), tasks2);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement2);

   this->Stop(slave.get());

   // Set up the futures before restarting the slave so that the
   // recovery dispatch and the re-registration message are not missed.
   Future<Nothing> _recover = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlaveMessage =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart the slave (use same flags) with a new isolator.
   TypeParam isolator2;

   slave = this->StartSlave(&isolator2, flags);
   ASSERT_SOME(slave);

   Clock::pause();

   AWAIT_READY(_recover);

   Clock::settle(); // Wait for slave to schedule reregister timeout.

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Wait for the slave to re-register.
   AWAIT_READY(reregisterSlaveMessage);

   Clock::resume();

   // Expectations for the status changes as a result of killing the
   // tasks.
   Future<TaskStatus> status1;
   EXPECT_CALL(sched1, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status1))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   Future<TaskStatus> status2;
   EXPECT_CALL(sched2, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status2))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   // Wait for both executors to terminate before shutting down the
   // slave in order to give cgroups (if applicable) time to clean up.
   Future<Nothing> executorTerminated1 =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);
   Future<Nothing> executorTerminated2 =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   // Kill task 1.
   driver1.killTask(task1.task_id());

   // Wait for TASK_KILLED update.
   AWAIT_READY(status1);
   ASSERT_EQ(TASK_KILLED, status1.get().state());

   // Kill task 2.
   driver2.killTask(task2.task_id());

   // Wait for TASK_KILLED update.
   AWAIT_READY(status2);
   ASSERT_EQ(TASK_KILLED, status2.get().state());

   AWAIT_READY(executorTerminated1);
   AWAIT_READY(executorTerminated2);

   driver1.stop();
   driver1.join();
   driver2.stop();
   driver2.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }


 // Test fixture for those slave recovery tests that only work when
 // ProcessIsolator is used. It takes the slave flags provided by
 // IsolatorTest<T> and turns on the recovery related ones.
 // TODO(jieyu): We use typed test here because it magically allows us
 // to access protected members in Slave (e.g. Slave::_recover).
 template <typename T>
 class SlaveRecoveryProcessIsolatorTest : public IsolatorTest<T>
 {
 public:
   // Returns the base fixture's slave flags with 'checkpoint' and
   // 'strict' set to true and 'recover' set to "reconnect".
   virtual slave::Flags CreateSlaveFlags()
   {
     slave::Flags recoveryFlags = IsolatorTest<T>::CreateSlaveFlags();

     // Recovery specific settings on top of the base flags.
     recoveryFlags.strict = true;
     recoveryFlags.recover = "reconnect";
     recoveryFlags.checkpoint = true;

     return recoveryFlags;
   }
 };


 // Register the SlaveRecoveryProcessIsolatorTest typed test case with
 // ProcessIsolator as its only type parameter.
 TYPED_TEST_CASE(SlaveRecoveryProcessIsolatorTest,
                 ::testing::Types<ProcessIsolator>);


 // This test verifies that slave recovery works properly even if
 // multiple slaves are co-located on the same host. Two slaves are
 // started one after the other, a long running task is launched on
 // each, both slaves are stopped and restarted with the same flags,
 // and after they have re-registered both tasks are killed and must
 // report TASK_KILLED.
 TYPED_TEST(SlaveRecoveryProcessIsolatorTest, MultipleSlaves)
 {
   Try<PID<Master> > master = this->StartMaster();
   ASSERT_SOME(master);

   // Enable checkpointing for the framework.
   FrameworkInfo frameworkInfo;
   frameworkInfo.CopyFrom(DEFAULT_FRAMEWORK_INFO);
   frameworkInfo.set_checkpoint(true);

   MockScheduler sched;
   MesosSchedulerDriver driver(&sched, frameworkInfo, master.get());

   EXPECT_CALL(sched, registered(_, _, _));

   driver.start();

   Future<vector<Offer> > offers1;
   EXPECT_CALL(sched, resourceOffers(&driver, _))
     .WillOnce(FutureArg<1>(&offers1));

   // Start the first slave.
   slave::Flags flags1 = this->CreateSlaveFlags();
   slave::ProcessIsolator isolator1;

   Try<PID<Slave> > slave1 = this->StartSlave(&isolator1, flags1);
   ASSERT_SOME(slave1);

   AWAIT_READY(offers1);
   ASSERT_EQ(1u, offers1.get().size());

   // Launch a long running task in the first slave.
   TaskInfo task1 = createTask(offers1.get()[0], "sleep 1000");
   vector<TaskInfo> tasks1;
   tasks1.push_back(task1);

   EXPECT_CALL(sched, statusUpdate(_, _))
     .Times(1);

   Future<Nothing> _statusUpdateAcknowledgement1 =
     FUTURE_DISPATCH(slave1.get(), &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers1.get()[0].id(), tasks1);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement1);

   Future<vector<Offer> > offers2;
   EXPECT_CALL(sched, resourceOffers(&driver, _))
     .WillOnce(FutureArg<1>(&offers2));

   // Start the second slave.
   slave::Flags flags2 = this->CreateSlaveFlags();
   slave::ProcessIsolator isolator2;

   Try<PID<Slave> > slave2 = this->StartSlave(&isolator2, flags2);
   ASSERT_SOME(slave2);

   AWAIT_READY(offers2);
   ASSERT_EQ(1u, offers2.get().size());

   // Launch a long running task in the second slave.
   TaskInfo task2 = createTask(offers2.get()[0], "sleep 1000");
   vector<TaskInfo> tasks2;
   tasks2.push_back(task2);

   EXPECT_CALL(sched, statusUpdate(_, _))
     .Times(1);

   Future<Nothing> _statusUpdateAcknowledgement2 =
     FUTURE_DISPATCH(slave2.get(), &Slave::_statusUpdateAcknowledgement);

   driver.launchTasks(offers2.get()[0].id(), tasks2);

   // Wait for the ACK to be checkpointed.
   AWAIT_READY(_statusUpdateAcknowledgement2);

   this->Stop(slave1.get());
   this->Stop(slave2.get());

   // Set up the futures before restarting the slaves so that neither
   // the recovery dispatches nor the re-registration messages are
   // missed. The PIDs are wildcards, so each pair of futures is
   // satisfied by whichever slave gets there.
   Future<Nothing> _recover1 = FUTURE_DISPATCH(_, &Slave::_recover);
   Future<Nothing> _recover2 = FUTURE_DISPATCH(_, &Slave::_recover);

   Future<ReregisterSlaveMessage> reregisterSlave1 =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);
   Future<ReregisterSlaveMessage> reregisterSlave2 =
     FUTURE_PROTOBUF(ReregisterSlaveMessage(), _, _);

   // Restart both slaves using the same flags with new isolators.
   slave::ProcessIsolator isolator3;

   slave1 = this->StartSlave(&isolator3, flags1);
   ASSERT_SOME(slave1);

   slave::ProcessIsolator isolator4;

   slave2 = this->StartSlave(&isolator4, flags2);
   ASSERT_SOME(slave2);

   Clock::pause();

   AWAIT_READY(_recover1);
   AWAIT_READY(_recover2);

   // Wait for slaves to schedule reregister timeout.
   Clock::settle();

   Clock::advance(EXECUTOR_REREGISTER_TIMEOUT);

   // Make sure all pending timeouts are fired.
   Clock::settle();

   Clock::resume();

   // Wait for the slaves to re-register.
   AWAIT_READY(reregisterSlave1);
   AWAIT_READY(reregisterSlave2);

   // Capture the first two status updates that follow; they are
   // expected to be the TASK_KILLED updates of the two tasks.
   Future<TaskStatus> status1;
   Future<TaskStatus> status2;
   EXPECT_CALL(sched, statusUpdate(_, _))
     .WillOnce(FutureArg<1>(&status1))
     .WillOnce(FutureArg<1>(&status2))
     .WillRepeatedly(Return());        // Ignore subsequent updates.

   Future<Nothing> executorTerminated1 =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);
   Future<Nothing> executorTerminated2 =
     FUTURE_DISPATCH(_, &Slave::executorTerminated);

   EXPECT_CALL(sched, resourceOffers(_, _))
     .WillRepeatedly(Return());        // Ignore subsequent offers.

   // Kill both tasks.
   driver.killTask(task1.task_id());
   driver.killTask(task2.task_id());

   AWAIT_READY(status1);
   ASSERT_EQ(TASK_KILLED, status1.get().state());

   AWAIT_READY(status2);
   ASSERT_EQ(TASK_KILLED, status2.get().state());

   // Wait for both executors to terminate before tearing down.
   AWAIT_READY(executorTerminated1);
   AWAIT_READY(executorTerminated2);

   driver.stop();
   driver.join();

   this->Shutdown(); // Shutdown before isolator(s) get deallocated.
 }