| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.hadoop.hdfs.server.namenode; |
| |
| import junit.framework.TestCase; |
| |
| import org.apache.hadoop.conf.Configuration; |
| import org.apache.hadoop.fs.FileStatus; |
| import org.apache.hadoop.fs.FileSystem; |
| import org.apache.hadoop.fs.Path; |
| import org.apache.hadoop.hdfs.server.common.Storage.StorageDirectory; |
| import org.apache.hadoop.hdfs.DFSConfigKeys; |
| import org.apache.hadoop.hdfs.MiniDFSCluster; |
| import org.apache.hadoop.hdfs.DFSTestUtil; |
| import org.apache.hadoop.hdfs.HdfsConfiguration; |
| import org.apache.hadoop.hdfs.protocol.HdfsConstants.SafeModeAction; |
| import org.apache.hadoop.hdfs.server.namenode.NNStorage.NameNodeDirType; |
| |
| import java.util.Collections; |
| import java.util.List; |
| |
| import java.io.File; |
| |
| /** |
| * A JUnit test for checking if restarting DFS preserves integrity. |
| * Specifically with FSImage being written in parallel |
| */ |
| public class TestParallelImageWrite extends TestCase { |
| private static final int NUM_DATANODES = 4; |
| /** check if DFS remains in proper condition after a restart */ |
| public void testRestartDFS() throws Exception { |
| final Configuration conf = new HdfsConfiguration(); |
| MiniDFSCluster cluster = null; |
| FSNamesystem fsn = null; |
| int numNamenodeDirs; |
| DFSTestUtil files = new DFSTestUtil("TestRestartDFS", 200, 3, 8*1024); |
| |
| final String dir = "/srcdat"; |
| final Path rootpath = new Path("/"); |
| final Path dirpath = new Path(dir); |
| |
| long rootmtime; |
| FileStatus rootstatus; |
| FileStatus dirstatus; |
| |
| try { |
| cluster = new MiniDFSCluster.Builder(conf).format(true) |
| .numDataNodes(NUM_DATANODES).build(); |
| String[] nameNodeDirs = conf.getStrings( |
| DFSConfigKeys.DFS_NAMENODE_NAME_DIR_KEY, new String[] {}); |
| numNamenodeDirs = nameNodeDirs.length; |
| assertTrue("failed to get number of Namenode StorageDirs", |
| numNamenodeDirs != 0); |
| FileSystem fs = cluster.getFileSystem(); |
| files.createFiles(fs, dir); |
| |
| rootmtime = fs.getFileStatus(rootpath).getModificationTime(); |
| rootstatus = fs.getFileStatus(dirpath); |
| dirstatus = fs.getFileStatus(dirpath); |
| |
| fs.setOwner(rootpath, rootstatus.getOwner() + "_XXX", null); |
| fs.setOwner(dirpath, null, dirstatus.getGroup() + "_XXX"); |
| } finally { |
| if (cluster != null) { cluster.shutdown(); } |
| } |
| try { |
| // Force the NN to save its images on startup so long as |
| // there are any uncheckpointed txns |
| conf.setInt(DFSConfigKeys.DFS_NAMENODE_CHECKPOINT_TXNS_KEY, 1); |
| |
| // Here we restart the MiniDFScluster without formatting namenode |
| cluster = new MiniDFSCluster.Builder(conf).format(false) |
| .numDataNodes(NUM_DATANODES).build(); |
| fsn = cluster.getNamesystem(); |
| FileSystem fs = cluster.getFileSystem(); |
| assertTrue("Filesystem corrupted after restart.", |
| files.checkFiles(fs, dir)); |
| |
| final FileStatus newrootstatus = fs.getFileStatus(rootpath); |
| assertEquals(rootmtime, newrootstatus.getModificationTime()); |
| assertEquals(rootstatus.getOwner() + "_XXX", newrootstatus.getOwner()); |
| assertEquals(rootstatus.getGroup(), newrootstatus.getGroup()); |
| |
| final FileStatus newdirstatus = fs.getFileStatus(dirpath); |
| assertEquals(dirstatus.getOwner(), newdirstatus.getOwner()); |
| assertEquals(dirstatus.getGroup() + "_XXX", newdirstatus.getGroup()); |
| rootmtime = fs.getFileStatus(rootpath).getModificationTime(); |
| |
| final String checkAfterRestart = checkImages(fsn, numNamenodeDirs); |
| |
| // Modify the system and then perform saveNamespace |
| files.cleanup(fs, dir); |
| files.createFiles(fs, dir); |
| fsn.setSafeMode(SafeModeAction.SAFEMODE_ENTER); |
| cluster.getNameNodeRpc().saveNamespace(); |
| final String checkAfterModify = checkImages(fsn, numNamenodeDirs); |
| assertFalse("Modified namespace should change fsimage contents. " + |
| "was: " + checkAfterRestart + " now: " + checkAfterModify, |
| checkAfterRestart.equals(checkAfterModify)); |
| fsn.setSafeMode(SafeModeAction.SAFEMODE_LEAVE); |
| files.cleanup(fs, dir); |
| } finally { |
| if (cluster != null) { cluster.shutdown(); } |
| } |
| } |
| |
| /** |
| * Confirm that FSImage files in all StorageDirectory are the same, |
| * and non-empty, and there are the expected number of them. |
| * @param fsn - the FSNamesystem being checked. |
| * @param numImageDirs - the configured number of StorageDirectory of type IMAGE. |
| * @return - the md5 hash of the most recent FSImage files, which must all be the same. |
| * @throws AssertionFailedError if image files are empty or different, |
| * if less than two StorageDirectory are provided, or if the |
| * actual number of StorageDirectory is less than configured. |
| */ |
| public static String checkImages( |
| FSNamesystem fsn, int numImageDirs) |
| throws Exception { |
| NNStorage stg = fsn.getFSImage().getStorage(); |
| //any failed StorageDirectory is removed from the storageDirs list |
| assertEquals("Some StorageDirectories failed Upgrade", |
| numImageDirs, stg.getNumStorageDirs(NameNodeDirType.IMAGE)); |
| assertTrue("Not enough fsimage copies in MiniDFSCluster " + |
| "to test parallel write", numImageDirs > 1); |
| |
| // List of "current/" directory from each SD |
| List<File> dirs = FSImageTestUtil.getCurrentDirs(stg, NameNodeDirType.IMAGE); |
| |
| // across directories, all files with same names should be identical hashes |
| FSImageTestUtil.assertParallelFilesAreIdentical( |
| dirs, Collections.<String>emptySet()); |
| FSImageTestUtil.assertSameNewestImage(dirs); |
| |
| // Return the hash of the newest image file |
| StorageDirectory firstSd = stg.dirIterator(NameNodeDirType.IMAGE).next(); |
| File latestImage = FSImageTestUtil.findLatestImageFile(firstSd); |
| String md5 = FSImageTestUtil.getImageFileMD5IgnoringTxId(latestImage); |
| System.err.println("md5 of " + latestImage + ": " + md5); |
| return md5; |
| } |
| } |
| |