// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
#include <list>
#include <memory>
#include <string>
#include <vector>

#include <process/clock.hpp>
#include <process/future.hpp>
#include <process/gmock.hpp>
#include <process/gtest.hpp>
#include <process/http.hpp>
#include <process/owned.hpp>

#include <stout/hashmap.hpp>
#include <stout/uri.hpp>

#include <stout/os/realpath.hpp>
#include "csi/paths.hpp"
#include "csi/state.hpp"
#include "linux/fs.hpp"
#include "master/detector/standalone.hpp"
#include "module/manager.hpp"
#include "slave/container_daemon_process.hpp"
#include "slave/paths.hpp"
#include "slave/state.hpp"
#include "slave/containerizer/fetcher.hpp"
#include "slave/containerizer/mesos/containerizer.hpp"
#include "tests/disk_profile_server.hpp"
#include "tests/flags.hpp"
#include "tests/mesos.hpp"
namespace http = process::http;
using std::list;
using std::shared_ptr;
using std::string;
using std::vector;
using mesos::internal::slave::ContainerDaemonProcess;
using mesos::master::detector::MasterDetector;
using mesos::master::detector::StandaloneMasterDetector;
using process::Clock;
using process::Future;
using process::Owned;
using process::Promise;
using process::post;
using testing::AtMost;
using testing::DoAll;
using testing::Not;
using testing::Sequence;
namespace mesos {
namespace internal {
namespace tests {
constexpr char URI_DISK_PROFILE_ADAPTOR_NAME[] =
"org_apache_mesos_UriDiskProfileAdaptor";
constexpr char TEST_SLRP_TYPE[] = "org.apache.mesos.rp.local.storage";
constexpr char TEST_SLRP_NAME[] = "test";
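// NOTE: These constants are substituted into the resource provider config
// created by `setupResourceProviderConfig()` below, and together they form
// the metric prefix built by `metricName()`.
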
class StorageLocalResourceProviderTest
: public ContainerizerTest<slave::MesosContainerizer>
{
public:
void SetUp() override
{
ContainerizerTest<slave::MesosContainerizer>::SetUp();
resourceProviderConfigDir =
path::join(sandbox.get(), "resource_provider_configs");
ASSERT_SOME(os::mkdir(resourceProviderConfigDir));
}
void TearDown() override
{
// Unload modules.
foreach (const Modules::Library& library, modules.libraries()) {
foreach (const Modules::Library::Module& module, library.modules()) {
if (module.has_name()) {
ASSERT_SOME(modules::ModuleManager::unload(module.name()));
}
}
}
foreach (const string& slaveWorkDir, slaveWorkDirs) {
// Clean up CSI endpoint directories, if there are any. Each endpoint
// directory is reached through a symlink under the CSI root directory and
// may live outside the agent work directory, so we resolve the symlink
// and remove its target explicitly.
const string csiRootDir = slave::paths::getCsiRootDir(slaveWorkDir);
Try<list<string>> csiContainerPaths =
csi::paths::getContainerPaths(csiRootDir, "*", "*");
ASSERT_SOME(csiContainerPaths);
foreach (const string& path, csiContainerPaths.get()) {
Try<csi::paths::ContainerPath> containerPath =
csi::paths::parseContainerPath(csiRootDir, path);
ASSERT_SOME(containerPath);
Result<string> endpointDir =
os::realpath(csi::paths::getEndpointDirSymlinkPath(
csiRootDir,
containerPath->type,
containerPath->name,
containerPath->containerId));
if (endpointDir.isSome()) {
ASSERT_SOME(os::rmdir(endpointDir.get()));
}
}
}
ContainerizerTest<slave::MesosContainerizer>::TearDown();
}
slave::Flags CreateSlaveFlags() override
{
slave::Flags flags =
ContainerizerTest<slave::MesosContainerizer>::CreateSlaveFlags();
// Store the agent work directory for cleaning up CSI endpoint
// directories during teardown.
// NOTE: DO NOT change the work directory afterward.
slaveWorkDirs.push_back(flags.work_dir);
return flags;
}
void loadUriDiskProfileAdaptorModule(
const string& uri,
const Option<Duration> pollInterval = None())
{
const string libraryPath = getModulePath("uri_disk_profile_adaptor");
Modules::Library* library = modules.add_libraries();
library->set_name("uri_disk_profile_adaptor");
library->set_file(libraryPath);
Modules::Library::Module* module = library->add_modules();
module->set_name(URI_DISK_PROFILE_ADAPTOR_NAME);
Parameter* _uri = module->add_parameters();
_uri->set_key("uri");
_uri->set_value(uri);
if (pollInterval.isSome()) {
Parameter* _pollInterval = module->add_parameters();
_pollInterval->set_key("poll_interval");
_pollInterval->set_value(stringify(pollInterval.get()));
}
ASSERT_SOME(modules::ModuleManager::load(modules));
}
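// For example, the profile-polling tests below load the module against a
// mock HTTP disk profile server with a 10-second poll interval:
//
//   loadUriDiskProfileAdaptorModule(
//       stringify(server.get()->process->url()), Seconds(10));
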
void setupResourceProviderConfig(
const Bytes& capacity,
const Option<string> volumes = None())
{
const string testCsiPluginName = "test_csi_plugin";
const string testCsiPluginPath =
path::join(tests::flags.build_dir, "src", "test-csi-plugin");
const string testCsiPluginWorkDir =
path::join(sandbox.get(), testCsiPluginName);
ASSERT_SOME(os::mkdir(testCsiPluginWorkDir));
Try<string> resourceProviderConfig = strings::format(
R"~(
{
"type": "%s",
"name": "%s",
"default_reservations": [
{
"type": "DYNAMIC",
"role": "storage"
}
],
"storage": {
"plugin": {
"type": "org.apache.mesos.csi.test",
"name": "%s",
"containers": [
{
"services": [
"CONTROLLER_SERVICE",
"NODE_SERVICE"
],
"command": {
"shell": false,
"value": "%s",
"arguments": [
"%s",
"--available_capacity=%s",
"--volumes=%s",
"--work_dir=%s"
]
}
}
]
}
}
}
)~",
TEST_SLRP_TYPE,
TEST_SLRP_NAME,
testCsiPluginName,
testCsiPluginPath,
testCsiPluginPath,
stringify(capacity),
volumes.getOrElse(""),
testCsiPluginWorkDir);
ASSERT_SOME(resourceProviderConfig);
ASSERT_SOME(os::write(
path::join(resourceProviderConfigDir, "test.json"),
resourceProviderConfig.get()));
}
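// For example, the tests below configure either an empty 4GB storage pool,
// or a 512KB pool plus one pre-existing volume (using the test CSI plugin's
// `<name>:<capacity>` volume syntax):
//
//   setupResourceProviderConfig(Gigabytes(4));
//   setupResourceProviderConfig(Kilobytes(512), "volume0:512KB");
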
// Create a JSON string representing a disk profile mapping containing the
// given profile.
static string createDiskProfileMapping(const string& profile)
{
Try<string> diskProfileMapping = strings::format(
R"~(
{
"profile_matrix": {
"%s": {
"csi_plugin_type_selector": {
"plugin_type": "org.apache.mesos.csi.test"
},
"volume_capabilities": {
"mount": {},
"access_mode": {
"mode": "SINGLE_NODE_WRITER"
}
}
}
}
}
)~",
profile);
// This extra closure is necessary in order to use `ASSERT_*`, as
// these macros require a void return type.
[&] { ASSERT_SOME(diskProfileMapping); }();
return diskProfileMapping.get();
}
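// For example, the tests below persist a mapping for profile "test" to a
// local file and point the URI disk profile adaptor at it:
//
//   const string profilesPath = path::join(sandbox.get(), "profiles.json");
//   ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
//   loadUriDiskProfileAdaptorModule(profilesPath);
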
string metricName(const string& basename)
{
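// Given the constants above, this evaluates to
// "resource_providers/org.apache.mesos.rp.local.storage.test/" + basename.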
return "resource_providers/" + stringify(TEST_SLRP_TYPE) + "." +
stringify(TEST_SLRP_NAME) + "/" + basename;
}
protected:
Modules modules;
vector<string> slaveWorkDirs;
string resourceProviderConfigDir;
};
// This test verifies that a storage local resource provider can report
// no resources and recover from this state.
TEST_F(StorageLocalResourceProviderTest, ROOT_NoResource)
{
Clock::pause();
setupResourceProviderConfig(Bytes(0));
Try<Owned<cluster::Master>> master = StartMaster();
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration and prevent retry.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
EXPECT_EQ(
0,
updateSlave2->resource_providers().providers(0).total_resources_size());
Clock::pause();
// Restart the agent.
slave.get()->terminate();
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave4 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave3 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration and prevent retry.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(updateSlave3);
Clock::resume();
AWAIT_READY(updateSlave4);
ASSERT_TRUE(updateSlave4->has_resource_providers());
ASSERT_EQ(1, updateSlave4->resource_providers().providers_size());
EXPECT_EQ(
0,
updateSlave4->resource_providers().providers(0).total_resources_size());
}
// This test verifies that any zero-sized volume reported by a CSI
// plugin will be ignored by the storage local resource provider.
TEST_F(StorageLocalResourceProviderTest, ROOT_ZeroSizedDisk)
{
Clock::pause();
setupResourceProviderConfig(Bytes(0), "volume0:0B");
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration and prevent retry.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Option<Resource> volume;
foreach (const Resource& resource,
updateSlave2->resource_providers().providers(0).total_resources()) {
if (Resources::hasResourceProvider(resource)) {
volume = resource;
}
}
ASSERT_NONE(volume);
}
// This test verifies that the storage local resource provider can
// correctly handle disks smaller than 1MB.
TEST_F(StorageLocalResourceProviderTest, ROOT_SmallDisk)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Kilobytes(512), "volume0:512KB");
master::Flags masterFlags = CreateMasterFlags();
// Use a small allocation interval to speed up the test. We do this
// instead of manipulating the clock to keep the test concise and
// avoid waiting for `UpdateSlaveMessage`s and pausing/resuming the
// clock multiple times.
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to receive offers.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
Future<vector<Offer>> rawDisksOffers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that do not contain wanted resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We expect to receive an offer that contains a storage pool and a
// pre-existing volume.
auto isStoragePool = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW &&
!r.disk().source().has_id() &&
r.disk().source().has_profile();
};
auto isPreExistingVolume = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_id() &&
!r.disk().source().has_profile();
};
// Since the resource provider always reports the pre-existing volume,
// but only reports the storage pool after it gets the profile, an
// offer containing the latter will also contain the former.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
isStoragePool)))
.WillOnce(FutureArg<1>(&rawDisksOffers));
driver.start();
AWAIT_READY(rawDisksOffers);
ASSERT_FALSE(rawDisksOffers->empty());
Option<Resource> storagePool;
Option<Resource> preExistingVolume;
foreach (const Resource& resource, rawDisksOffers->at(0).resources()) {
if (isStoragePool(resource)) {
storagePool = resource;
} else if (isPreExistingVolume(resource)) {
preExistingVolume = resource;
}
}
ASSERT_SOME(storagePool);
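// NOTE: Disk resource scalars are expressed in megabytes, so we multiply
// by `Bytes::MEGABYTES` to recover the exact size in bytes for comparison.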
EXPECT_EQ(
Kilobytes(512),
Bytes(storagePool->scalar().value() * Bytes::MEGABYTES));
ASSERT_SOME(preExistingVolume);
EXPECT_EQ(
Kilobytes(512),
Bytes(preExistingVolume->scalar().value() * Bytes::MEGABYTES));
}
// This test verifies that a framework can receive offers containing new
// storage pools from the storage local resource provider after a profile
// appears.
TEST_F(StorageLocalResourceProviderTest, ROOT_ProfileAppeared)
{
Clock::pause();
Future<shared_ptr<TestDiskProfileServer>> server =
TestDiskProfileServer::create();
AWAIT_READY(server);
Promise<http::Response> updatedProfileMapping;
EXPECT_CALL(*server.get()->process, profiles(_))
.WillOnce(Return(http::OK("{}")))
.WillOnce(Return(updatedProfileMapping.future()));
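// The first poll returns an empty profile mapping; the second poll is
// blocked until `updatedProfileMapping` is satisfied later in the test.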
const Duration pollInterval = Seconds(10);
loadUriDiskProfileAdaptorModule(
stringify(server.get()->process->url()),
pollInterval);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration and prevent retry.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
Clock::pause();
// Register a framework to receive offers.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
Future<vector<Offer>> offersBeforeProfileFound;
Future<vector<Offer>> offersAfterProfileFound;
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillOnce(DoAll(
FutureArg<1>(&offersBeforeProfileFound),
DeclineOffers(declineFilters)))
.WillOnce(FutureArg<1>(&offersAfterProfileFound));
driver.start();
AWAIT_READY(offersBeforeProfileFound);
ASSERT_FALSE(offersBeforeProfileFound->empty());
// The offer should not have any resource from the resource provider before
// the profile appears.
Resources resourceProviderResources =
Resources(offersBeforeProfileFound->at(0).resources())
.filter(&Resources::hasResourceProvider);
EXPECT_TRUE(resourceProviderResources.empty());
// Trigger another poll for profiles. The framework will not receive an offer
// because there is no change in resources yet.
Clock::advance(pollInterval);
Clock::settle();
// Update the disk profile mapping.
updatedProfileMapping.set(http::OK(createDiskProfileMapping("test")));
// Advance the clock to make sure another allocation is triggered.
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offersAfterProfileFound);
ASSERT_FALSE(offersAfterProfileFound->empty());
// A storage pool is a RAW disk that has a profile but no ID.
auto isStoragePool = [](const Resource& r, const string& profile) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW &&
!r.disk().source().has_id() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == profile;
};
// A new storage pool with profile "test" should show up now.
Resources storagePools =
Resources(offersAfterProfileFound->at(0).resources())
.filter(std::bind(isStoragePool, lambda::_1, "test"));
EXPECT_FALSE(storagePools.empty());
}
// This test verifies that the storage local resource provider can
// create and then destroy a new volume from a storage pool.
TEST_F(StorageLocalResourceProviderTest, ROOT_CreateDestroyDisk)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a RAW disk resource after `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools and volumes with the "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Destroy the created volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
Option<Resource> destroyed;
foreach (const Resource& resource, volumeDestroyedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
destroyed = resource;
break;
}
}
ASSERT_SOME(destroyed);
ASSERT_FALSE(destroyed->disk().source().has_id());
ASSERT_FALSE(destroyed->disk().source().has_metadata());
ASSERT_FALSE(destroyed->disk().source().has_mount());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that the storage local resource provider can
// destroy a volume created from a storage pool after recovery.
TEST_F(StorageLocalResourceProviderTest, ROOT_CreateDestroyDiskRecovery)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a MOUNT disk resource after the agent recovers
// from a failover.
// 4. One containing a RAW disk resource after `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> slaveRecoveredOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools and volumes with the "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Restart the agent.
EXPECT_CALL(sched, offerRescinded(_, _));
slave.get()->terminate();
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&slaveRecoveredOffers));
slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRecoveredOffers);
ASSERT_FALSE(slaveRecoveredOffers->empty());
// Destroy the created volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{slaveRecoveredOffers->at(0).id()},
{DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
Option<Resource> destroyed;
foreach (const Resource& resource, volumeDestroyedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
destroyed = resource;
break;
}
}
ASSERT_SOME(destroyed);
ASSERT_FALSE(destroyed->disk().source().has_id());
ASSERT_FALSE(destroyed->disk().source().has_metadata());
ASSERT_FALSE(destroyed->disk().source().has_mount());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that a framework cannot create a volume while or after
// its profile disappears, and that destroying a volume with a stale profile
// recovers the freed disk under a newly appeared profile.
TEST_F(StorageLocalResourceProviderTest, ROOT_ProfileDisappeared)
{
Clock::pause();
Future<shared_ptr<TestDiskProfileServer>> server =
TestDiskProfileServer::create();
AWAIT_READY(server);
Promise<http::Response> updatedProfileMapping;
EXPECT_CALL(*server.get()->process, profiles(_))
.WillOnce(Return(http::OK(createDiskProfileMapping("test1"))))
.WillOnce(Return(updatedProfileMapping.future()));
const Duration pollInterval = Seconds(10);
loadUriDiskProfileAdaptorModule(
stringify(server.get()->process->url()),
pollInterval);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration and prevent retry.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
Clock::pause();
// Register a framework to receive offers.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. A 4GB RAW disk with profile 'test1' before the 1st `CREATE_DISK`.
// 2. A 2GB MOUNT disk and a 2GB RAW disk, both with profile 'test1', after
// the 1st `CREATE_DISK` finishes.
// 3. A 2GB MOUNT disk with profile 'test1' and a 2GB RAW disk with profile
// 'test2', after the profile mapping is updated and the 2nd
// `CREATE_DISK` fails due to a mismatched resource version.
// 4. A 4GB RAW disk with profile 'test2', after the `DESTROY_DISK`.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> profileDisappearedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
&Resources::hasResourceProvider)))
.WillOnce(FutureArg<1>(&rawDiskOffers))
.WillOnce(FutureArg<1>(&volumeCreatedOffers))
.WillOnce(FutureArg<1>(&profileDisappearedOffers))
.WillOnce(FutureArg<1>(&volumeDestroyedOffers))
.WillRepeatedly(Return()); // Ignore subsequent offers.
driver.start();
// NOTE: If the framework has not yet declined an unwanted offer when the
// resource provider reports its RAW resources, the new allocation triggered
// by this update will not generate an allocatable offer, since it contains
// no CPU or memory resources. So we first settle the clock to ensure that
// the unwanted offer has been declined, then advance the clock to trigger
// another allocation.
Clock::settle();
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
auto hasSourceTypeAndProfile = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type,
const string& profile) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == type &&
r.disk().source().has_profile() &&
r.disk().source().profile() == profile;
};
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
// Create a volume with profile 'test1'.
{
Resources raw =
Resources(rawDiskOffers->at(0).resources()).filter(std::bind(
hasSourceTypeAndProfile,
lambda::_1,
Resource::DiskInfo::Source::RAW,
"test1"));
ASSERT_SOME_EQ(Gigabytes(4), raw.disk());
// Just use 2GB of the storage pool.
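// (Disk resource scalars are expressed in megabytes, so the value set
// below is 2048.)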
Resource source = *raw.begin();
source.mutable_scalar()->set_value(
(double) Gigabytes(2).bytes() / Bytes::MEGABYTES);
Future<UpdateOperationStatusMessage> createVolumeStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source, Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(createVolumeStatus);
EXPECT_EQ(OPERATION_FINISHED, createVolumeStatus->status().state());
}
// Advance the clock to trigger another allocation.
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
// We drop the agent update (which is triggered by the changes in the known
// set of profiles) to simulate the situation where the update races with
// an offer operation.
Future<UpdateSlaveMessage> updateSlave3 =
DROP_PROTOBUF(UpdateSlaveMessage(), _, _);
// Trigger another poll for profiles. Profile 'test1' will disappear and
// profile 'test2' will appear.
//
// NOTE: We advance the clock before updating the disk profile mapping so
// there will only be one poll.
Clock::advance(pollInterval);
// Update the disk profile mapping.
updatedProfileMapping.set(http::OK(createDiskProfileMapping("test2")));
AWAIT_READY(updateSlave3);
// Try to create another volume with profile 'test1', which will be dropped
// due to a mismatched resource version.
{
Resources raw =
Resources(volumeCreatedOffers->at(0).resources()).filter(std::bind(
hasSourceTypeAndProfile,
lambda::_1,
Resource::DiskInfo::Source::RAW,
"test1"));
ASSERT_SOME_EQ(Gigabytes(2), raw.disk());
Future<UpdateOperationStatusMessage> createVolumeStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{CREATE_DISK(*raw.begin(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(createVolumeStatus);
EXPECT_EQ(OPERATION_DROPPED, createVolumeStatus->status().state());
}
// Forward the dropped agent update to trigger another allocation.
post(slave.get()->pid, master.get()->pid, updateSlave3.get());
AWAIT_READY(profileDisappearedOffers);
ASSERT_FALSE(profileDisappearedOffers->empty());
// Destroy the volume with profile 'test1', which will trigger an agent update
// to recover the freed disk with profile 'test2' and thus another allocation.
{
Resources volumes =
Resources(profileDisappearedOffers->at(0).resources()).filter(std::bind(
hasSourceTypeAndProfile,
lambda::_1,
Resource::DiskInfo::Source::MOUNT,
"test1"));
ASSERT_SOME_EQ(Gigabytes(2), volumes.disk());
Future<UpdateOperationStatusMessage> destroyVolumeStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
driver.acceptOffers(
{profileDisappearedOffers->at(0).id()},
{DESTROY_DISK(*volumes.begin())},
acceptFilters);
AWAIT_READY(destroyVolumeStatus);
EXPECT_EQ(OPERATION_FINISHED, destroyVolumeStatus->status().state());
}
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
// Check that the freed disk has been recovered with profile 'test2'.
{
Resources storagePool =
Resources(volumeDestroyedOffers->at(0).resources()).filter(std::bind(
hasSourceTypeAndProfile,
lambda::_1,
Resource::DiskInfo::Source::RAW,
"test2"));
EXPECT_SOME_EQ(Gigabytes(4), storagePool.disk());
}
}
// This test verifies that if an agent is registered with a new ID, the
// ID of the resource provider will change as well, and any previously
// created volume becomes a pre-existing volume.
TEST_F(StorageLocalResourceProviderTest, ROOT_AgentRegisteredWithNewId)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a RAW pre-existing volume after the agent
// is registered with a new ID.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> slaveRecoveredOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// Before the agent fails over, we are interested in storage pools and
// volumes with the "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> createdVolume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
createdVolume = resource;
break;
}
}
ASSERT_SOME(createdVolume);
ASSERT_TRUE(createdVolume->has_provider_id());
ASSERT_TRUE(createdVolume->disk().source().has_id());
ASSERT_TRUE(createdVolume->disk().source().has_metadata());
ASSERT_TRUE(createdVolume->disk().source().has_mount());
ASSERT_TRUE(createdVolume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(createdVolume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label,
createdVolume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Shut down the agent.
EXPECT_CALL(sched, offerRescinded(_, _));
slave.get()->terminate();
// Remove the `latest` symlink to register the agent with a new ID.
const string metaDir = slave::paths::getMetaRootDir(slaveFlags.work_dir);
ASSERT_SOME(os::rm(slave::paths::getLatestSlavePath(metaDir)));
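// Without the symlink, agent recovery finds no checkpointed agent ID, so
// the agent registers as a brand new agent.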
// A new registration would trigger another `SlaveRegisteredMessage`.
slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, Not(slave.get()->pid));
// After the agent fails over, any previously created volume becomes a
// pre-existing volume, which has an ID but no profile.
auto isPreExistingVolume = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_id() &&
!r.disk().source().has_profile();
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
isPreExistingVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&slaveRecoveredOffers));
slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
AWAIT_READY(slaveRecoveredOffers);
ASSERT_FALSE(slaveRecoveredOffers->empty());
Option<Resource> preExistingVolume;
foreach (const Resource& resource, slaveRecoveredOffers->at(0).resources()) {
if (isPreExistingVolume(resource) &&
resource.disk().source().type() == Resource::DiskInfo::Source::RAW) {
preExistingVolume = resource;
}
}
ASSERT_SOME(preExistingVolume);
ASSERT_TRUE(preExistingVolume->has_provider_id());
ASSERT_NE(createdVolume->provider_id(), preExistingVolume->provider_id());
ASSERT_EQ(
createdVolume->disk().source().id(),
preExistingVolume->disk().source().id());
}
// This test verifies that the storage local resource provider can
// publish a volume required by a task, then destroy the published
// volume after the task finishes.
TEST_F(StorageLocalResourceProviderTest, ROOT_PublishResources)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a persistent volume after `CREATE` and `LAUNCH`.
// 4. One containing the original RAW disk resource after `DESTROY`
// and `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> taskFinishedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools and volumes with the "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Put a file into the volume.
ASSERT_SOME(os::touch(path::join(volumePath.get(), "file")));
// Create a persistent volume on the CSI volume, then launch a task to
// use the persistent volume.
Resource persistentVolume = volume.get();
persistentVolume.mutable_disk()->mutable_persistence()
->set_id(id::UUID::random().toString());
persistentVolume.mutable_disk()->mutable_persistence()
->set_principal(framework.principal());
persistentVolume.mutable_disk()->mutable_volume()
->set_container_path("volume");
persistentVolume.mutable_disk()->mutable_volume()->set_mode(Volume::RW);
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&taskFinishedOffers));
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{CREATE(persistentVolume),
LAUNCH({createTask(
volumeCreatedOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("test -f " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
AWAIT_READY(taskFinishedOffers);
// Destroy the persistent volume and the CSI volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(source.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{taskFinishedOffers->at(0).id()},
{DESTROY(persistentVolume),
DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that the storage local resource provider can
// destroy a published volume after recovery.
TEST_F(StorageLocalResourceProviderTest, ROOT_PublishResourcesRecovery)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a persistent volume after `CREATE` and `LAUNCH`.
// 4. One containing the same persistent volume after the agent
// recovers from a failover.
// 5. One containing the same persistent volume after another `LAUNCH`.
// 6. One containing the original RAW disk resource after `DESTROY`
// and `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> task1FinishedOffers;
Future<vector<Offer>> slaveRecoveredOffers;
Future<vector<Offer>> task2FinishedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain the
// resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools and volumes with the "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that unused resources will not be
// filtered out of subsequent offers for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Create a persistent volume on the CSI volume, then launch a task to
// use the persistent volume.
Resource persistentVolume = volume.get();
persistentVolume.mutable_disk()->mutable_persistence()
->set_id(id::UUID::random().toString());
persistentVolume.mutable_disk()->mutable_persistence()
->set_principal(framework.principal());
persistentVolume.mutable_disk()->mutable_volume()
->set_container_path("volume");
persistentVolume.mutable_disk()->mutable_volume()->set_mode(Volume::RW);
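// Accept the offer with a `CREATE` and a `LAUNCH` in a single call, so
// the persistent volume is created and immediately used by a task that
// writes a file for a later task to verify.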
{
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&task1FinishedOffers));
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{CREATE(persistentVolume),
LAUNCH({createTask(
volumeCreatedOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("touch " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
}
AWAIT_READY(task1FinishedOffers);
// Restart the agent.
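// The outstanding offer will be rescinded when the agent is shut down.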
EXPECT_CALL(sched, offerRescinded(_, _));
slave.get()->terminate();
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&slaveRecoveredOffers));
slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRecoveredOffers);
ASSERT_FALSE(slaveRecoveredOffers->empty());
// Launch another task to read the file that is created by the
// previous task on the persistent volume.
{
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&task2FinishedOffers));
driver.acceptOffers(
{slaveRecoveredOffers->at(0).id()},
{LAUNCH({createTask(
slaveRecoveredOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("test -f " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
}
AWAIT_READY(task2FinishedOffers);
// Destroy the persistent volume and the CSI volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(source.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{task2FinishedOffers->at(0).id()},
{DESTROY(persistentVolume),
DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that the storage local resource provider can
// destroy a published volume after an agent reboot.
TEST_F(StorageLocalResourceProviderTest, ROOT_PublishResourcesReboot)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a persistent volume after `CREATE` and `LAUNCH`.
// 4. One containing the same persistent volume after the agent
// recovers from a failover.
// 5. One containing the same persistent volume after another `LAUNCH`.
// 6. One containing the original RAW disk resource after `DESTROY`
// and `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> task1FinishedOffers;
Future<vector<Offer>> slaveRecoveredOffers;
Future<vector<Offer>> task2FinishedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain
// the resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools or volumes with a
// "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that any remaining resources will
// not be filtered for the default 5 seconds when we accept the offer.
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
// Create a persistent volume on the CSI volume, then launch a task to
// use the persistent volume.
Resource persistentVolume = volume.get();
persistentVolume.mutable_disk()->mutable_persistence()
->set_id(id::UUID::random().toString());
persistentVolume.mutable_disk()->mutable_persistence()
->set_principal(framework.principal());
persistentVolume.mutable_disk()->mutable_volume()
->set_container_path("volume");
persistentVolume.mutable_disk()->mutable_volume()->set_mode(Volume::RW);
{
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&task1FinishedOffers));
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{CREATE(persistentVolume),
LAUNCH({createTask(
volumeCreatedOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("touch " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
}
AWAIT_READY(task1FinishedOffers);
// Destroy the agent object to shut down all containers.
EXPECT_CALL(sched, offerRescinded(_, _));
slave->reset();
// Modify the boot ID to simulate a reboot.
ASSERT_SOME(os::write(
slave::paths::getBootIdPath(
slave::paths::getMetaRootDir(slaveFlags.work_dir)),
"rebooted! ;)"));
const string csiRootDir = slave::paths::getCsiRootDir(slaveFlags.work_dir);
Try<list<string>> volumePaths =
csi::paths::getVolumePaths(csiRootDir, "*", "*");
ASSERT_SOME(volumePaths);
ASSERT_FALSE(volumePaths->empty());
foreach (const string& path, volumePaths.get()) {
Try<csi::paths::VolumePath> volumePath =
csi::paths::parseVolumePath(csiRootDir, path);
ASSERT_SOME(volumePath);
const string volumeStatePath = csi::paths::getVolumeStatePath(
csiRootDir,
volumePath->type,
volumePath->name,
volumePath->volumeId);
Result<csi::state::VolumeState> volumeState =
slave::state::read<csi::state::VolumeState>(volumeStatePath);
ASSERT_SOME(volumeState);
if (volumeState->state() == csi::state::VolumeState::PUBLISHED) {
volumeState->set_boot_id("rebooted! ;)");
ASSERT_SOME(slave::state::checkpoint(volumeStatePath, volumeState.get()));
}
}
// Unmount all CSI volumes to simulate a reboot.
ASSERT_SOME(fs::unmountAll(csiRootDir));
// Restart the agent.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&slaveRecoveredOffers));
slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRecoveredOffers);
ASSERT_FALSE(slaveRecoveredOffers->empty());
// Launch another task to read the file that is created by the
// previous task on the persistent volume.
{
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&task2FinishedOffers));
driver.acceptOffers(
{slaveRecoveredOffers->at(0).id()},
{LAUNCH({createTask(
slaveRecoveredOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("test -f " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
}
AWAIT_READY(task2FinishedOffers);
// Destroy the persistent volume and the CSI volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(source.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{task2FinishedOffers->at(0).id()},
{DESTROY(persistentVolume),
DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that the storage local resource provider can
// restart its CSI plugin after it is killed and continue to work
// properly.
TEST_F(
StorageLocalResourceProviderTest,
ROOT_PublishUnpublishResourcesPluginKilled)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
slave::Fetcher fetcher(slaveFlags);
Try<slave::MesosContainerizer*> _containerizer =
slave::MesosContainerizer::create(slaveFlags, false, &fetcher);
ASSERT_SOME(_containerizer);
Owned<slave::MesosContainerizer> containerizer(_containerizer.get());
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave =
StartSlave(detector.get(), containerizer.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing the same MOUNT disk resource after `CREATE`,
// `LAUNCH` and `DESTROY`.
// 4. One containing the same RAW disk resource after `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> taskFinishedOffers;
Future<vector<Offer>> volumeDestroyedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain
// the resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools or volumes with a
// "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// Get the ID of the CSI plugin container.
Future<hashset<ContainerID>> pluginContainers = containerizer->containers();
AWAIT_READY(pluginContainers);
ASSERT_EQ(1u, pluginContainers->size());
const ContainerID& pluginContainerId = *pluginContainers->begin();
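// The container daemon should relaunch the plugin container after it is
// killed; we intercept the `launchContainer` dispatch to detect the
// restart.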
Future<Nothing> pluginRestarted =
FUTURE_DISPATCH(_, &ContainerDaemonProcess::launchContainer);
// Kill the plugin container and wait for it to restart.
Future<int> pluginKilled = containerizer->status(pluginContainerId)
.then([](const ContainerStatus& status) {
return os::kill(status.executor_pid(), SIGKILL);
});
AWAIT_ASSERT_EQ(0, pluginKilled);
AWAIT_READY(pluginRestarted);
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that any remaining resources will
// not be filtered for the default 5 seconds when we accept the offer.
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
// Check if the volume is actually created by the test CSI plugin.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
EXPECT_TRUE(os::exists(volumePath.get()));
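// Kill the plugin again after the volume has been created to verify
// that the resource provider keeps working with a restarted plugin.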
pluginRestarted =
FUTURE_DISPATCH(_, &ContainerDaemonProcess::launchContainer);
// Kill the plugin container and wait for it to restart.
pluginKilled = containerizer->status(pluginContainerId)
.then([](const ContainerStatus& status) {
return os::kill(status.executor_pid(), SIGKILL);
});
AWAIT_ASSERT_EQ(0, pluginKilled);
AWAIT_READY(pluginRestarted);
// Put a file into the volume.
ASSERT_SOME(os::touch(path::join(volumePath.get(), "file")));
// Create a persistent volume on the CSI volume, then launch a task to
// use the persistent volume.
Resource persistentVolume = volume.get();
persistentVolume.mutable_disk()->mutable_persistence()
->set_id(id::UUID::random().toString());
persistentVolume.mutable_disk()->mutable_persistence()
->set_principal(framework.principal());
persistentVolume.mutable_disk()->mutable_volume()
->set_container_path("volume");
persistentVolume.mutable_disk()->mutable_volume()->set_mode(Volume::RW);
Future<TaskStatus> taskStarting;
Future<TaskStatus> taskRunning;
Future<TaskStatus> taskFinished;
EXPECT_CALL(sched, statusUpdate(&driver, _))
.WillOnce(FutureArg<1>(&taskStarting))
.WillOnce(FutureArg<1>(&taskRunning))
.WillOnce(FutureArg<1>(&taskFinished));
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(
persistentVolume)))
.InSequence(offers)
.WillOnce(FutureArg<1>(&taskFinishedOffers));
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{CREATE(persistentVolume),
LAUNCH({createTask(
volumeCreatedOffers->at(0).slave_id(),
persistentVolume,
createCommandInfo("test -f " + path::join("volume", "file")))})},
acceptFilters);
AWAIT_READY(taskStarting);
EXPECT_EQ(TASK_STARTING, taskStarting->state());
AWAIT_READY(taskRunning);
EXPECT_EQ(TASK_RUNNING, taskRunning->state());
AWAIT_READY(taskFinished);
EXPECT_EQ(TASK_FINISHED, taskFinished->state());
AWAIT_READY(taskFinishedOffers);
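// Kill the plugin once more after the task has finished to verify that
// `DESTROY` and `DESTROY_DISK` still succeed after the plugin restarts.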
pluginRestarted =
FUTURE_DISPATCH(_, &ContainerDaemonProcess::launchContainer);
// Kill the plugin container and wait for it to restart.
pluginKilled = containerizer->status(pluginContainerId)
.then([](const ContainerStatus& status) {
return os::kill(status.executor_pid(), SIGKILL);
});
AWAIT_ASSERT_EQ(0, pluginKilled);
AWAIT_READY(pluginRestarted);
// Destroy the persistent volume and the CSI volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(source.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeDestroyedOffers));
driver.acceptOffers(
{taskFinishedOffers->at(0).id()},
{DESTROY(persistentVolume),
DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(volumeDestroyedOffers);
ASSERT_FALSE(volumeDestroyedOffers->empty());
// Check if the volume is actually deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that the storage local resource provider can import a
// preprovisioned CSI volume as a MOUNT disk of a given profile, and return
// the space to the storage pool after the volume is destroyed.
TEST_F(StorageLocalResourceProviderTest, ROOT_ImportPreprovisionedVolume)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
// NOTE: We set up the resource provider with an extra storage pool, so
// that when the storage pool is offered, we know that the corresponding
// profile is known to the resource provider.
setupResourceProviderConfig(Gigabytes(2), "volume1:2GB");
Try<Owned<cluster::Master>> master = StartMaster();
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW preprovisioned volume before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing a RAW storage pool after `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> diskCreatedOffers;
Future<vector<Offer>> diskDestroyedOffers;
// We use the following filter to decline offers that do not contain
// the resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
auto isStoragePool = [](const Resource& r, const string& profile) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW &&
!r.disk().source().has_id() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == profile;
};
// NOTE: Instead of expecting a preprovisioned volume, we expect an offer
// with a 'test' storage pool as an indication that the profile is known
// to the resource provider. The offer should also contain the
// preprovisioned volume. However, an extra offer with the storage pool
// may be received as a side effect of this workaround, so we decline it
// if that happens.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(isStoragePool, lambda::_1, "test"))))
.WillOnce(FutureArg<1>(&rawDiskOffers))
.WillRepeatedly(DeclineOffers(declineFilters));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_EQ(1u, rawDiskOffers->size());
auto isPreprovisionedVolume = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW &&
r.disk().source().has_id() &&
!r.disk().source().has_profile();
};
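// The offer should contain 2GB of preprovisioned RAW volumes, i.e., RAW
// disk resources that have volume IDs but no profile.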
Resources _preprovisioned = Resources(rawDiskOffers->at(0).resources())
.filter(isPreprovisionedVolume);
ASSERT_SOME_EQ(Gigabytes(2), _preprovisioned.disk());
Resource preprovisioned = *_preprovisioned.begin();
// Get the volume path of the preprovisioned volume.
Option<string> volumePath;
foreach (const Label& label,
preprovisioned.disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
ASSERT_TRUE(os::exists(volumePath.get()));
auto isMountDisk = [](const Resource& r, const string& profile) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().type() == Resource::DiskInfo::Source::MOUNT &&
r.disk().source().has_id() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == profile;
};
// Apply profile 'test' to the preprovisioned volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(isMountDisk, lambda::_1, "test"))))
.WillOnce(FutureArg<1>(&diskCreatedOffers));
// We use the following filter so that any remaining resources will
// not be filtered for the default 5 seconds when we accept the offer.
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(preprovisioned, Resource::DiskInfo::Source::MOUNT, "test")},
acceptFilters);
AWAIT_READY(diskCreatedOffers);
ASSERT_EQ(1u, diskCreatedOffers->size());
Resource created = *Resources(diskCreatedOffers->at(0).resources())
.filter(std::bind(isMountDisk, lambda::_1, "test"))
.begin();
// Destroy the created disk.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(isStoragePool, lambda::_1, "test"))))
.WillOnce(FutureArg<1>(&diskDestroyedOffers));
driver.acceptOffers(
{diskCreatedOffers->at(0).id()},
{DESTROY_DISK(created)},
acceptFilters);
AWAIT_READY(diskDestroyedOffers);
ASSERT_EQ(1u, diskDestroyedOffers->size());
Resources raw = Resources(diskDestroyedOffers->at(0).resources())
.filter(std::bind(isStoragePool, lambda::_1, "test"));
EXPECT_SOME_EQ(Gigabytes(4), raw.disk());
// Check if the volume is deleted by the test CSI plugin.
EXPECT_FALSE(os::exists(volumePath.get()));
}
// This test verifies that operation status updates are resent to the master
// after being dropped en route to it.
//
// To accomplish this, the test:
// 1. Creates a volume from a RAW disk resource.
// 2. Drops the first `UpdateOperationStatusMessage` from the agent to the
// master, so that it isn't acknowledged by the master.
// 3. Advances the clock and verifies that the agent resends the operation
// status update.
TEST_F(StorageLocalResourceProviderTest, ROOT_RetryOperationStatusUpdate)
{
Clock::pause();
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags flags = CreateSlaveFlags();
flags.isolation = "filesystem/linux";
flags.resource_provider_config_dir = resourceProviderConfigDir;
flags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), flags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(flags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Clock::pause();
// Register a framework to exercise an operation.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
Future<vector<Offer>> offers;
// Decline offers without RAW disk resources. The master can send such offers
// before the resource provider reports its RAW resources, or after receiving
// the `UpdateOperationStatusMessage`.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers());
auto isRaw = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(isRaw)))
.WillOnce(FutureArg<1>(&offers));
driver.start();
// NOTE: If the framework has not yet declined an unwanted offer when the
// resource provider reports its RAW resources, the new allocation
// triggered by this update won't generate an allocatable offer, since no
// CPU or memory is left. So we first settle the clock to ensure that the
// unwanted offer has been declined, then advance the clock to trigger
// another allocation.
Clock::settle();
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offers);
ASSERT_FALSE(offers->empty());
const Offer& offer = offers->at(0);
Option<Resource> source;
foreach (const Resource& resource, offer.resources()) {
if (isRaw(resource)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// We'll drop the first operation status update from the agent to the master.
Future<UpdateOperationStatusMessage> droppedUpdateOperationStatusMessage =
DROP_PROTOBUF(
UpdateOperationStatusMessage(), slave.get()->pid, master.get()->pid);
// Create a volume.
driver.acceptOffers(
{offer.id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
{});
AWAIT_READY(droppedUpdateOperationStatusMessage);
// The SLRP should resend the dropped operation status update after the
// status update retry interval minimum.
Future<UpdateOperationStatusMessage> retriedUpdateOperationStatusMessage =
FUTURE_PROTOBUF(
UpdateOperationStatusMessage(), slave.get()->pid, master.get()->pid);
// The master should acknowledge the operation status update.
Future<AcknowledgeOperationStatusMessage> acknowledgeOperationStatusMessage =
FUTURE_PROTOBUF(
AcknowledgeOperationStatusMessage(), master.get()->pid, slave.get()->pid);
Clock::advance(slave::STATUS_UPDATE_RETRY_INTERVAL_MIN);
AWAIT_READY(retriedUpdateOperationStatusMessage);
AWAIT_READY(acknowledgeOperationStatusMessage);
// The master acknowledged the operation status update, so the SLRP shouldn't
// send further operation status updates.
EXPECT_NO_FUTURE_PROTOBUFS(UpdateOperationStatusMessage(), _, _);
Clock::advance(slave::STATUS_UPDATE_RETRY_INTERVAL_MIN);
Clock::settle();
driver.stop();
driver.join();
}
// This test verifies that, after an agent restart, unacknowledged
// operation status updates are resent to the master.
//
// To accomplish this, the test:
// 1. Creates a volume from a RAW disk resource.
// 2. Drops the first `UpdateOperationStatusMessage` from the agent to the
// master, so that it isn't acknowledged by the master.
// 3. Restarts the agent.
// 4. Verifies that the agent resends the operation status update.
TEST_F(
StorageLocalResourceProviderTest,
ROOT_RetryOperationStatusUpdateAfterRecovery)
{
Clock::pause();
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags flags = CreateSlaveFlags();
flags.isolation = "filesystem/linux";
flags.resource_provider_config_dir = resourceProviderConfigDir;
flags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), flags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(flags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Clock::pause();
// Register a framework to exercise an operation.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
Future<vector<Offer>> offers;
// Decline offers without RAW disk resources. The master can send such offers
// before the resource provider reports its RAW resources, or after receiving
// the `UpdateOperationStatusMessage`.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers());
auto isRaw = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(isRaw)))
.WillOnce(FutureArg<1>(&offers));
driver.start();
// NOTE: If the framework has not yet declined an unwanted offer when the
// resource provider reports its RAW resources, the new allocation
// triggered by this update won't generate an allocatable offer, since no
// CPU or memory is left. So we first settle the clock to ensure that the
// unwanted offer has been declined, then advance the clock to trigger
// another allocation.
Clock::settle();
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offers);
ASSERT_FALSE(offers->empty());
const Offer& offer = offers->at(0);
Option<Resource> source;
foreach (const Resource& resource, offer.resources()) {
if (isRaw(resource)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
// We'll drop the first operation status update from the agent to the master.
Future<UpdateOperationStatusMessage> droppedUpdateOperationStatusMessage =
DROP_PROTOBUF(
UpdateOperationStatusMessage(), slave.get()->pid, master.get()->pid);
// Create a volume.
driver.acceptOffers(
{offer.id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
{});
AWAIT_READY(droppedUpdateOperationStatusMessage);
// Restart the agent.
slave.get()->terminate();
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
Future<UpdateSlaveMessage> updateSlave4 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave3 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
// Once the agent is restarted, the SLRP should resend the dropped operation
// status update.
Future<UpdateOperationStatusMessage> retriedUpdateOperationStatusMessage =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, master.get()->pid);
// The master should acknowledge the operation status update once.
Future<AcknowledgeOperationStatusMessage> acknowledgeOperationStatusMessage =
FUTURE_PROTOBUF(AcknowledgeOperationStatusMessage(), master.get()->pid, _);
slave = StartSlave(detector.get(), flags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(flags.registration_backoff_factor);
AWAIT_READY(updateSlave3);
// Resume the clock so that the CSI plugin's standalone container is created
// and the SLRP's async loop notices it.
Clock::resume();
AWAIT_READY(updateSlave4);
ASSERT_TRUE(updateSlave4->has_resource_providers());
ASSERT_EQ(1, updateSlave4->resource_providers().providers_size());
Clock::pause();
AWAIT_READY(retriedUpdateOperationStatusMessage);
AWAIT_READY(acknowledgeOperationStatusMessage);
// The master has acknowledged the operation status update, so the SLRP
// shouldn't send further operation status updates.
EXPECT_NO_FUTURE_PROTOBUFS(UpdateOperationStatusMessage(), _, _);
Clock::advance(slave::STATUS_UPDATE_RETRY_INTERVAL_MIN);
Clock::settle();
driver.stop();
driver.join();
}
// This test verifies that the storage local resource provider properly
// reports the metric related to CSI plugin container terminations.
TEST_F(StorageLocalResourceProviderTest, ROOT_ContainerTerminationMetric)
{
setupResourceProviderConfig(Gigabytes(4));
Try<Owned<cluster::Master>> master = StartMaster();
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slave::Fetcher fetcher(slaveFlags);
Try<slave::MesosContainerizer*> _containerizer =
slave::MesosContainerizer::create(slaveFlags, false, &fetcher);
ASSERT_SOME(_containerizer);
Owned<slave::MesosContainerizer> containerizer(_containerizer.get());
Future<Nothing> pluginConnected =
FUTURE_DISPATCH(_, &ContainerDaemonProcess::waitContainer);
Try<Owned<cluster::Slave>> slave = StartSlave(
detector.get(),
containerizer.get(),
slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(pluginConnected);
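// The termination metric should exist and read zero before the plugin
// container is killed.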
JSON::Object snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/container_terminations")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"csi_plugin/container_terminations")));
// Get the ID of the CSI plugin container.
Future<hashset<ContainerID>> pluginContainers = containerizer->containers();
AWAIT_READY(pluginContainers);
ASSERT_EQ(1u, pluginContainers->size());
const ContainerID& pluginContainerId = *pluginContainers->begin();
Future<Nothing> pluginRestarted =
FUTURE_DISPATCH(_, &ContainerDaemonProcess::launchContainer);
// Kill the plugin container and wait for it to restart.
// NOTE: We need to wait for `pluginConnected` before issuing the kill;
// otherwise we may kill the plugin before it has created the endpoint
// socket, in which case the resource provider would wait for one minute.
Future<int> pluginKilled = containerizer->status(pluginContainerId)
.then([](const ContainerStatus& status) {
return os::kill(status.executor_pid(), SIGKILL);
});
AWAIT_ASSERT_EQ(0, pluginKilled);
AWAIT_READY(pluginRestarted);
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/container_terminations")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/container_terminations")));
}
// This test verifies that the storage local resource provider properly
// reports metrics related to operation states.
// TODO(chhsiao): Currently there is no way to test the `pending` metric for
// operations since we have no control over the completion of an operation. Once
// we support out-of-band CSI plugins through domain sockets, we could test this
// metric against a mock CSI plugin.
TEST_F(StorageLocalResourceProviderTest, ROOT_OperationStateMetrics)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing the same MOUNT disk resource after a failed
// `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> operationFailedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain
// the resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools or volumes with a
// "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
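// Before any operation is applied, the operation state metrics should
// exist and read zero.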
JSON::Object snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/create_disk/finished")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/create_disk/finished")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/failed")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/destroy_disk/failed")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/dropped")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/destroy_disk/dropped")));
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that any remaining resources will
// not be filtered for the default 5 seconds when we accept the offer.
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/create_disk/finished")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/create_disk/finished")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/failed")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/destroy_disk/failed")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/dropped")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/destroy_disk/dropped")));
// Remove the volume out of band to fail `DESTROY_DISK`.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
ASSERT_SOME(os::rmdir(volumePath.get()));
// Destroy the created volume, which will fail.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(volume.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&operationFailedOffers))
.WillRepeatedly(DeclineOffers(declineFilters)); // Decline further offers.
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(operationFailedOffers);
ASSERT_FALSE(operationFailedOffers->empty());
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/create_disk/finished")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/create_disk/finished")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/failed")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/destroy_disk/failed")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/dropped")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"operations/destroy_disk/dropped")));
// Destroy the volume again, which will be dropped this time.
Future<ApplyOperationMessage> applyOperationMessage =
DROP_PROTOBUF(ApplyOperationMessage(), _, _);
driver.acceptOffers(
{operationFailedOffers->at(0).id()},
{DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(applyOperationMessage);
ASSERT_TRUE(applyOperationMessage
->resource_version_uuid().has_resource_provider_id());
// Spoof the resource version UUID in the operation message so that it
// mismatches the resource provider's current one, which causes the
// `DESTROY_DISK` to be dropped.
Future<UpdateOperationStatusMessage> operationDroppedStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
ApplyOperationMessage spoofedApplyOperationMessage =
applyOperationMessage.get();
spoofedApplyOperationMessage.mutable_resource_version_uuid()->mutable_uuid()
->set_value(id::UUID::random().toBytes());
post(master.get()->pid, slave.get()->pid, spoofedApplyOperationMessage);
AWAIT_READY(operationDroppedStatus);
EXPECT_EQ(OPERATION_DROPPED, operationDroppedStatus->status().state());
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/create_disk/finished")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/create_disk/finished")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/failed")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/destroy_disk/failed")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"operations/destroy_disk/dropped")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"operations/destroy_disk/dropped")));
}
// This test verifies that the storage local resource provider properly
// reports metrics related to RPCs to CSI plugins.
// TODO(chhsiao): Currently there is no way to test the `pending` and
// `cancelled` metrics for RPCs since we have no control over the completion of
// an operation. Once we support out-of-band CSI plugins through domain sockets,
// we could test these metrics against a mock CSI plugin.
TEST_F(StorageLocalResourceProviderTest, ROOT_CsiPluginRpcMetrics)
{
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
masterFlags.allocation_interval = Milliseconds(50);
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), slaveFlags);
ASSERT_SOME(slave);
AWAIT_READY(slaveRegisteredMessage);
// Register a framework to exercise operations.
FrameworkInfo framework = DEFAULT_FRAMEWORK_INFO;
framework.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, framework, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// The framework is expected to see the following offers in sequence:
// 1. One containing a RAW disk resource before `CREATE_DISK`.
// 2. One containing a MOUNT disk resource after `CREATE_DISK`.
// 3. One containing the same MOUNT disk resource after a failed
// `DESTROY_DISK`.
//
// We set up the expectations for these offers as the test progresses.
Future<vector<Offer>> rawDiskOffers;
Future<vector<Offer>> volumeCreatedOffers;
Future<vector<Offer>> operationFailedOffers;
Sequence offers;
// We use the following filter to decline offers that do not contain
// the resources we want for 365 days (the maximum refusal duration).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that contain only the agent's default resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
// We are only interested in storage pools or volumes with a
// "test" profile.
auto hasSourceType = [](
const Resource& r,
const Resource::DiskInfo::Source::Type& type) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().profile() == "test" &&
r.disk().source().type() == type;
};
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::RAW))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&rawDiskOffers));
driver.start();
AWAIT_READY(rawDiskOffers);
ASSERT_FALSE(rawDiskOffers->empty());
Option<Resource> source;
foreach (const Resource& resource, rawDiskOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::RAW)) {
source = resource;
break;
}
}
ASSERT_SOME(source);
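// Once the RAW resources have been reported, the bootstrap RPCs (e.g.,
// `Probe`, `GetPluginInfo`, the capability queries, `ListVolumes` and
// `GetCapacity`) should have recorded successes, while `CreateVolume`
// has not been called yet.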
JSON::Object snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
EXPECT_EQ(2, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
// Create a volume.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(
std::bind(hasSourceType, lambda::_1, Resource::DiskInfo::Source::MOUNT))))
.InSequence(offers)
.WillOnce(FutureArg<1>(&volumeCreatedOffers));
// We use the following filter so that any remaining resources will
// not be filtered for the default 5 seconds when we accept the offer.
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
driver.acceptOffers(
{rawDiskOffers->at(0).id()},
{CREATE_DISK(source.get(), Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
AWAIT_READY(volumeCreatedOffers);
ASSERT_FALSE(volumeCreatedOffers->empty());
Option<Resource> volume;
foreach (const Resource& resource, volumeCreatedOffers->at(0).resources()) {
if (hasSourceType(resource, Resource::DiskInfo::Source::MOUNT)) {
volume = resource;
break;
}
}
ASSERT_SOME(volume);
ASSERT_TRUE(volume->disk().source().has_id());
ASSERT_TRUE(volume->disk().source().has_metadata());
ASSERT_TRUE(volume->disk().source().has_mount());
ASSERT_TRUE(volume->disk().source().mount().has_root());
EXPECT_FALSE(path::absolute(volume->disk().source().mount().root()));
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
EXPECT_EQ(2, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
EXPECT_EQ(0, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
// Remove the volume out of band to fail `DESTROY_DISK`.
Option<string> volumePath;
foreach (const Label& label, volume->disk().source().metadata().labels()) {
if (label.key() == "path") {
volumePath = label.value();
break;
}
}
ASSERT_SOME(volumePath);
ASSERT_SOME(os::rmdir(volumePath.get()));
// Destroy the created volume, which will fail.
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveResource(volume.get())))
.InSequence(offers)
.WillOnce(FutureArg<1>(&operationFailedOffers))
.WillRepeatedly(DeclineOffers(declineFilters)); // Decline further offers.
driver.acceptOffers(
{volumeCreatedOffers->at(0).id()},
{DESTROY_DISK(volume.get())},
acceptFilters);
AWAIT_READY(operationFailedOffers);
ASSERT_FALSE(operationFailedOffers->empty());
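// Take another metrics snapshot: the out-of-band removal causes the
// `DeleteVolume` call to fail, so its error counter should now read 1,
// while the `CreateVolume` success counter should still read 1.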
snapshot = Metrics();
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.Probe/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
EXPECT_EQ(2, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginInfo/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Identity.GetPluginCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ControllerGetCapabilities/successes"))); // NOLINT(whitespace/line_length)
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.ListVolumes/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.GetCapacity/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.CreateVolume/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Controller.DeleteVolume/errors")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetCapabilities/successes")));
ASSERT_NE(0u, snapshot.values.count(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
EXPECT_EQ(1, snapshot.values.at(metricName(
"csi_plugin/rpcs/csi.v0.Node.NodeGetId/successes")));
}
// This test verifies that the master reconciles operations that are missing
// from a reregistering slave. In this case, one of the two
// `ApplyOperationMessage`s is dropped, so the resource provider should send
// exactly one OPERATION_DROPPED status update.
//
// TODO(greggomann): Test operations on agent default resources: for such
// operations, the agent generates the dropped status.
TEST_F(StorageLocalResourceProviderTest, ROOT_ReconcileDroppedOperation)
{
Clock::pause();
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
StandaloneMasterDetector detector(master.get()->pid);
slave::Flags slaveFlags = CreateSlaveFlags();
slaveFlags.isolation = "filesystem/linux";
slaveFlags.resource_provider_config_dir = resourceProviderConfigDir;
slaveFlags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
Future<SlaveRegisteredMessage> slaveRegisteredMessage =
FUTURE_PROTOBUF(SlaveRegisteredMessage(), _, _);
// Since the local resource provider daemon is started after the agent is
// registered, it is guaranteed that the agent will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from the
// storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(&detector, slaveFlags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(slaveRegisteredMessage);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by the
// plugin container, which runs in another Linux process. Since we do not have
// a `Future` linked to the standalone container launch to await on, it is
// difficult to accomplish this without resuming the clock.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Clock::pause();
FrameworkInfo frameworkInfo = DEFAULT_FRAMEWORK_INFO;
frameworkInfo.set_roles(0, "storage");
MockScheduler sched;
MesosSchedulerDriver driver(
&sched, frameworkInfo, master.get()->pid, DEFAULT_CREDENTIAL);
EXPECT_CALL(sched, registered(&driver, _, _));
// We use the following filter to decline offers that do not contain
// wanted resources for 365 days (the maximum).
Filters declineFilters;
declineFilters.set_refuse_seconds(Days(365).secs());
// Decline offers that do not contain wanted resources.
EXPECT_CALL(sched, resourceOffers(&driver, _))
.WillRepeatedly(DeclineOffers(declineFilters));
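// A RAW disk resource with a profile is what the storage local resource
// provider offers before any `CREATE_DISK` is applied to it.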
auto isRaw = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == Resource::DiskInfo::Source::RAW;
};
Future<vector<Offer>> offersBeforeOperations;
EXPECT_CALL(sched, resourceOffers(&driver, OffersHaveAnyResource(isRaw)))
.WillOnce(FutureArg<1>(&offersBeforeOperations))
.WillRepeatedly(DeclineOffers(declineFilters)); // Decline further offers.
driver.start();
AWAIT_READY(offersBeforeOperations);
ASSERT_EQ(1u, offersBeforeOperations->size());
Resources raw =
Resources(offersBeforeOperations->at(0).resources()).filter(isRaw);
// Create two MOUNT disks of 2GB each.
ASSERT_SOME_EQ(Gigabytes(4), raw.disk());
Resource source1 = *raw.begin();
source1.mutable_scalar()->set_value(
static_cast<double>(Gigabytes(2).bytes()) / Bytes::MEGABYTES);
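// NOTE: Scalar disk resources are measured in megabytes, hence the
// conversion above. The remaining 2GB of RAW disk becomes the source of
// the second `CREATE_DISK`.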
Resource source2 = *(raw - source1).begin();
// Drop one of the operations on the way to the agent.
Future<ApplyOperationMessage> applyOperationMessage =
DROP_PROTOBUF(ApplyOperationMessage(), _, _);
// The successful operation will result in a terminal update.
Future<UpdateOperationStatusMessage> operationFinishedStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
// We use a filter with zero `refuse_seconds` so that the unused
// resources will not be filtered for 5 seconds (the default).
Filters acceptFilters;
acceptFilters.set_refuse_seconds(0);
// Attempt the creation of two volumes.
driver.acceptOffers(
{offersBeforeOperations->at(0).id()},
{CREATE_DISK(source1, Resource::DiskInfo::Source::MOUNT),
CREATE_DISK(source2, Resource::DiskInfo::Source::MOUNT)},
acceptFilters);
// Ensure that the operations are processed.
Clock::settle();
AWAIT_READY(applyOperationMessage);
AWAIT_READY(operationFinishedStatus);
Future<SlaveReregisteredMessage> slaveReregisteredMessage =
FUTURE_PROTOBUF(SlaveReregisteredMessage(), _, _);
// Observe explicit operation reconciliation between master and agent.
Future<ReconcileOperationsMessage> reconcileOperationsMessage =
FUTURE_PROTOBUF(ReconcileOperationsMessage(), _, _);
Future<UpdateOperationStatusMessage> operationDroppedStatus =
FUTURE_PROTOBUF(UpdateOperationStatusMessage(), _, _);
// The master may send an offer with the agent's resources after the agent
// reregisters, but before an `UpdateSlaveMessage` is sent containing the
// resource provider's resources. In this case, the offer will be rescinded.
EXPECT_CALL(sched, offerRescinded(&driver, _))
.Times(AtMost(1));
// Simulate a spurious master change event (e.g., due to ZooKeeper
// expiration) at the slave to force re-registration.
detector.appoint(master.get()->pid);
// Advance the clock to trigger agent registration.
Clock::advance(slaveFlags.registration_backoff_factor);
AWAIT_READY(slaveReregisteredMessage);
AWAIT_READY(reconcileOperationsMessage);
AWAIT_READY(operationDroppedStatus);
std::set<OperationState> expectedStates =
{OperationState::OPERATION_DROPPED,
OperationState::OPERATION_FINISHED};
std::set<OperationState> observedStates =
{operationFinishedStatus->status().state(),
operationDroppedStatus->status().state()};
ASSERT_EQ(expectedStates, observedStates);
Future<vector<Offer>> offersAfterOperations;
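// A MOUNT disk with a profile indicates a successfully created volume.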
auto isMountDisk = [](const Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == Resource::DiskInfo::Source::MOUNT;
};
EXPECT_CALL(
sched, resourceOffers(&driver, OffersHaveAnyResource(isMountDisk)))
.WillOnce(FutureArg<1>(&offersAfterOperations));
// Advance the clock to trigger a batch allocation.
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offersAfterOperations);
ASSERT_FALSE(offersAfterOperations->empty());
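// Since one of the two `CREATE_DISK`s was dropped on the way to the
// agent, exactly one RAW source should have been converted into a MOUNT
// disk.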
Resources converted =
Resources(offersAfterOperations->at(0).resources()).filter(isMountDisk);
ASSERT_EQ(1u, converted.size());
// TODO(greggomann): Add inspection of dropped operation metrics here once
// such metrics have been added. See MESOS-8406.
// Settle the clock to ensure that unexpected messages will cause errors.
Clock::settle();
driver.stop();
driver.join();
}
// This test verifies that if an operation ID is specified, operation status
// updates are resent to the scheduler until acknowledged.
TEST_F(
StorageLocalResourceProviderTest,
ROOT_RetryOperationStatusUpdateToScheduler)
{
Clock::pause();
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags flags = CreateSlaveFlags();
flags.isolation = "filesystem/linux";
flags.resource_provider_config_dir = resourceProviderConfigDir;
flags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), flags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(flags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Clock::pause();
// Register a framework to exercise an operation.
v1::FrameworkInfo frameworkInfo = v1::DEFAULT_FRAMEWORK_INFO;
frameworkInfo.set_roles(0, "storage");
auto scheduler = std::make_shared<v1::MockHTTPScheduler>();
EXPECT_CALL(*scheduler, connected(_))
.WillOnce(v1::scheduler::SendSubscribe(frameworkInfo));
Future<v1::scheduler::Event::Subscribed> subscribed;
EXPECT_CALL(*scheduler, subscribed(_, _))
.WillOnce(FutureArg<1>(&subscribed));
EXPECT_CALL(*scheduler, heartbeat(_))
.WillRepeatedly(Return()); // Ignore heartbeats.
// Decline offers that do not contain wanted resources.
EXPECT_CALL(*scheduler, offers(_, _))
.WillRepeatedly(v1::scheduler::DeclineOffers());
Future<v1::scheduler::Event::Offers> offers;
auto isRaw = [](const v1::Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == v1::Resource::DiskInfo::Source::RAW;
};
EXPECT_CALL(
*scheduler, offers(_, v1::scheduler::OffersHaveAnyResource(isRaw)))
.WillOnce(FutureArg<1>(&offers));
v1::scheduler::TestMesos mesos(
master.get()->pid,
ContentType::PROTOBUF,
scheduler);
AWAIT_READY(subscribed);
v1::FrameworkID frameworkId(subscribed->framework_id());
// NOTE: If the framework has not declined an unwanted offer yet when
// the master updates the agent with the RAW disk resource, the new
// allocation triggered by this update won't generate an allocatable
// offer due to no CPU and memory resources. So here we first settle
// the clock to ensure that the unwanted offer has been declined, then
// advance the clock to trigger another allocation.
Clock::settle();
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offers);
ASSERT_FALSE(offers->offers().empty());
const v1::Offer& offer = offers->offers(0);
Option<v1::Resource> source;
Option<mesos::v1::ResourceProviderID> resourceProviderId;
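// Pick a RAW source from the offer and remember its resource provider
// ID, which is needed to acknowledge the operation status update later.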
foreach (const v1::Resource& resource, offer.resources()) {
if (isRaw(resource)) {
source = resource;
ASSERT_TRUE(resource.has_provider_id());
resourceProviderId = resource.provider_id();
break;
}
}
ASSERT_SOME(source);
ASSERT_SOME(resourceProviderId);
Future<v1::scheduler::Event::UpdateOperationStatus> update;
Future<v1::scheduler::Event::UpdateOperationStatus> retriedUpdate;
EXPECT_CALL(*scheduler, updateOperationStatus(_, _))
.WillOnce(FutureArg<1>(&update))
.WillOnce(FutureArg<1>(&retriedUpdate));
// Create a volume.
const string operationId = "operation";
mesos.send(v1::createCallAccept(
frameworkId,
offer,
{v1::CREATE_DISK(
source.get(),
v1::Resource::DiskInfo::Source::MOUNT,
None(),
operationId)}));
AWAIT_READY(update);
ASSERT_EQ(operationId, update->status().operation_id().value());
ASSERT_EQ(
mesos::v1::OperationState::OPERATION_FINISHED, update->status().state());
ASSERT_TRUE(update->status().has_uuid());
ASSERT_TRUE(retriedUpdate.isPending());
Clock::advance(slave::STATUS_UPDATE_RETRY_INTERVAL_MIN);
Clock::settle();
// The scheduler didn't acknowledge the operation status update, so the
// SLRP should resend it once the minimum status update retry interval
// has elapsed.
AWAIT_READY(retriedUpdate);
ASSERT_EQ(operationId, retriedUpdate->status().operation_id().value());
ASSERT_EQ(
mesos::v1::OperationState::OPERATION_FINISHED,
retriedUpdate->status().state());
ASSERT_TRUE(retriedUpdate->status().has_uuid());
// The scheduler will acknowledge the operation status update, so the agent
// should receive an acknowledgement.
Future<AcknowledgeOperationStatusMessage> acknowledgeOperationStatusMessage =
FUTURE_PROTOBUF(
AcknowledgeOperationStatusMessage(), master.get()->pid, slave.get()->pid);
mesos.send(v1::createCallAcknowledgeOperationStatus(
frameworkId, offer.agent_id(), resourceProviderId.get(), update.get()));
AWAIT_READY(acknowledgeOperationStatusMessage);
// Now that the SLRP has received the acknowledgement, the SLRP shouldn't
// send further operation status updates.
EXPECT_NO_FUTURE_PROTOBUFS(UpdateOperationStatusMessage(), _, _);
Clock::advance(slave::STATUS_UPDATE_RETRY_INTERVAL_MIN);
Clock::settle();
}
// This test ensures that the master responds with the latest state
// for operations that are terminal at the master, but have not been
// acknowledged by the framework.
TEST_F(
StorageLocalResourceProviderTest,
ROOT_ReconcileUnacknowledgedTerminalOperation)
{
Clock::pause();
const string profilesPath = path::join(sandbox.get(), "profiles.json");
ASSERT_SOME(os::write(profilesPath, createDiskProfileMapping("test")));
loadUriDiskProfileAdaptorModule(profilesPath);
setupResourceProviderConfig(Gigabytes(4));
master::Flags masterFlags = CreateMasterFlags();
Try<Owned<cluster::Master>> master = StartMaster(masterFlags);
ASSERT_SOME(master);
Owned<MasterDetector> detector = master.get()->createDetector();
slave::Flags flags = CreateSlaveFlags();
flags.isolation = "filesystem/linux";
flags.resource_provider_config_dir = resourceProviderConfigDir;
flags.disk_profile_adaptor = URI_DISK_PROFILE_ADAPTOR_NAME;
// Since the local resource provider daemon is started after the agent
// is registered, it is guaranteed that the slave will send two
// `UpdateSlaveMessage`s, where the latter one contains resources from
// the storage local resource provider.
//
// NOTE: The order of the two `FUTURE_PROTOBUF`s is reversed because
// Google Mock will search the expectations in reverse order.
Future<UpdateSlaveMessage> updateSlave2 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Future<UpdateSlaveMessage> updateSlave1 =
FUTURE_PROTOBUF(UpdateSlaveMessage(), _, _);
Try<Owned<cluster::Slave>> slave = StartSlave(detector.get(), flags);
ASSERT_SOME(slave);
// Advance the clock to trigger agent registration.
Clock::advance(flags.registration_backoff_factor);
AWAIT_READY(updateSlave1);
// NOTE: We need to resume the clock so that the resource provider can
// periodically check if the CSI endpoint socket has been created by
// the plugin container, which runs in another Linux process.
Clock::resume();
AWAIT_READY(updateSlave2);
ASSERT_TRUE(updateSlave2->has_resource_providers());
ASSERT_EQ(1, updateSlave2->resource_providers().providers_size());
Clock::pause();
// Register a framework to exercise an operation.
v1::FrameworkInfo frameworkInfo = v1::DEFAULT_FRAMEWORK_INFO;
frameworkInfo.set_roles(0, "storage");
auto scheduler = std::make_shared<v1::MockHTTPScheduler>();
EXPECT_CALL(*scheduler, connected(_))
.WillOnce(v1::scheduler::SendSubscribe(frameworkInfo));
Future<v1::scheduler::Event::Subscribed> subscribed;
EXPECT_CALL(*scheduler, subscribed(_, _))
.WillOnce(FutureArg<1>(&subscribed));
EXPECT_CALL(*scheduler, heartbeat(_))
.WillRepeatedly(Return()); // Ignore heartbeats.
// Decline offers that do not contain wanted resources.
EXPECT_CALL(*scheduler, offers(_, _))
.WillRepeatedly(v1::scheduler::DeclineOffers());
Future<v1::scheduler::Event::Offers> offers;
auto isRaw = [](const v1::Resource& r) {
return r.has_disk() &&
r.disk().has_source() &&
r.disk().source().has_profile() &&
r.disk().source().type() == v1::Resource::DiskInfo::Source::RAW;
};
EXPECT_CALL(
*scheduler, offers(_, v1::scheduler::OffersHaveAnyResource(isRaw)))
.WillOnce(FutureArg<1>(&offers));
v1::scheduler::TestMesos mesos(
master.get()->pid,
ContentType::PROTOBUF,
scheduler);
AWAIT_READY(subscribed);
v1::FrameworkID frameworkId(subscribed->framework_id());
// NOTE: If the framework has not declined an unwanted offer yet when
// the master updates the agent with the RAW disk resource, the new
// allocation triggered by this update won't generate an allocatable
// offer due to no CPU and memory resources. So here we first settle
// the clock to ensure that the unwanted offer has been declined, then
// advance the clock to trigger another allocation.
Clock::settle();
Clock::advance(masterFlags.allocation_interval);
AWAIT_READY(offers);
ASSERT_FALSE(offers->offers().empty());
const v1::Offer& offer = offers->offers(0);
const v1::AgentID& agentId = offer.agent_id();
Future<v1::scheduler::Event::UpdateOperationStatus> update;
EXPECT_CALL(*scheduler, updateOperationStatus(_, _))
.WillOnce(FutureArg<1>(&update));
Option<v1::Resource> source;
Option<mesos::v1::ResourceProviderID> resourceProviderId;
foreach (const v1::Resource& resource, offer.resources()) {
if (isRaw(resource)) {
source = resource;
ASSERT_TRUE(resource.has_provider_id());
resourceProviderId = resource.provider_id();
break;
}
}
ASSERT_SOME(source);
ASSERT_SOME(resourceProviderId);
v1::OperationID operationId;
operationId.set_value("operation");
mesos.send(v1::createCallAccept(
frameworkId,
offer,
{v1::CREATE_DISK(
source.get(),
v1::Resource::DiskInfo::Source::MOUNT,
None(),
operationId.value())}));
AWAIT_READY(update);
ASSERT_EQ(operationId, update->status().operation_id());
ASSERT_EQ(v1::OperationState::OPERATION_FINISHED, update->status().state());
ASSERT_TRUE(update->status().has_uuid());
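// Reconcile the operation without acknowledging its terminal status.
// The master should reply with the latest known state.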
v1::scheduler::Call::ReconcileOperations::Operation operation;
operation.mutable_operation_id()->CopyFrom(operationId);
operation.mutable_agent_id()->CopyFrom(agentId);
const Future<v1::scheduler::APIResult> result =
mesos.call({v1::createCallReconcileOperations(frameworkId, {operation})});
AWAIT_READY(result);
// The master should respond with '200 OK' and with a `scheduler::Response`.
ASSERT_EQ(process::http::Status::OK, result->status_code());
ASSERT_TRUE(result->has_response());
const v1::scheduler::Response response = result->response();
ASSERT_EQ(v1::scheduler::Response::RECONCILE_OPERATIONS, response.type());
ASSERT_TRUE(response.has_reconcile_operations());
const v1::scheduler::Response::ReconcileOperations& reconcile =
response.reconcile_operations();
ASSERT_EQ(1, reconcile.operation_statuses_size());
const v1::OperationStatus& operationStatus = reconcile.operation_statuses(0);
ASSERT_EQ(operationId, operationStatus.operation_id());
ASSERT_EQ(v1::OPERATION_FINISHED, operationStatus.state());
ASSERT_TRUE(operationStatus.has_uuid());
}
} // namespace tests {
} // namespace internal {
} // namespace mesos {