/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hdfs;
import static org.junit.Assert.assertTrue;
import java.io.IOException;
import java.util.Arrays;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.CommonConfigurationKeys;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.junit.Test;
/**
* This class tests that blocks can be larger than 2GB
*/
public class TestLargeBlock {
  /*
   * Uncomment this block to enable verbose logging while debugging; the
   * classes referenced here (GenericTestUtils, DataNode, LeaseManager,
   * FSNamesystem, DFSClient, Level) would need to be imported as well.
   *
   * {
   *   GenericTestUtils.setLogLevel(DataNode.LOG, Level.ALL);
   *   GenericTestUtils.setLogLevel(LeaseManager.LOG, Level.ALL);
   *   GenericTestUtils.setLogLevel(FSNamesystem.LOG, Level.ALL);
   *   GenericTestUtils.setLogLevel(DFSClient.LOG, Level.ALL);
   *   GenericTestUtils.setLogLevel(TestLargeBlock.LOG, Level.ALL);
   * }
   */
private static final Log LOG = LogFactory.getLog(TestLargeBlock.class);
// should we verify the data read back from the file? (slow)
static final boolean verifyData = true;
static final byte[] pattern = { 'D', 'E', 'A', 'D', 'B', 'E', 'E', 'F'};
// creates a file
static FSDataOutputStream createFile(FileSystem fileSys, Path name, int repl,
final long blockSize)
throws IOException {
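    // create(path, overwrite, bufferSize, replication, blockSize): the
    // oversized block size is the parameter under test here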
FSDataOutputStream stm = fileSys.create(name, true, fileSys.getConf()
.getInt(CommonConfigurationKeys.IO_FILE_BUFFER_SIZE_KEY, 4096),
(short) repl, blockSize);
LOG.info("createFile: Created " + name + " with " + repl + " replica.");
return stm;
}
/**
* Writes pattern to file
* @param stm FSDataOutputStream to write the file
* @param fileSize size of the file to be written
* @throws IOException in case of errors
*/
static void writeFile(FSDataOutputStream stm, final long fileSize)
throws IOException {
    // write in chunks of 64 MB (a multiple of the pattern length, so each
    // chunk starts on a pattern boundary); compute in long first so the
    // overflow check is meaningful
    final long writeSizeLong = (long) pattern.length * 8 * 1024 * 1024;
    if (writeSizeLong > Integer.MAX_VALUE) {
      throw new IOException("A single write is too large " + writeSizeLong);
    }
    final int writeSize = (int) writeSizeLong;
long bytesToWrite = fileSize;
byte[] b = new byte[writeSize];
// initialize buffer
for (int j = 0; j < writeSize; j++) {
b[j] = pattern[j % pattern.length];
}
while (bytesToWrite > 0) {
// how many bytes we are writing in this iteration
int thiswrite = (int) Math.min(writeSize, bytesToWrite);
stm.write(b, 0, thiswrite);
bytesToWrite -= thiswrite;
}
}
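  /**
   * Hypothetical helper (not part of the original test): returns the byte
   * expected at a given file offset. Because the file is the 8-byte pattern
   * repeated from offset 0, the expected byte depends only on the offset
   * modulo the pattern length.
   * @param offset position in the file
   * @return the pattern byte expected at that position
   */
  static byte expectedByteAt(final long offset) {
    return pattern[(int) (offset % pattern.length)];
  }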
/**
* Reads from file and makes sure that it matches the pattern
* @param fs a reference to FileSystem
* @param name Path of a file
* @param fileSize size of the file
* @throws IOException in case of errors
*/
static void checkFullFile(FileSystem fs, Path name, final long fileSize)
throws IOException {
    // read in chunks of 128 MB (a multiple of the pattern length); compute
    // in long first so the overflow check is meaningful
    final long readSizeLong = (long) pattern.length * 16 * 1024 * 1024;
    if (readSizeLong > Integer.MAX_VALUE) {
      throw new IOException("A single read is too large " + readSizeLong);
    }
    final int readSize = (int) readSizeLong;
byte[] b = new byte[readSize];
long bytesToRead = fileSize;
byte[] compb = new byte[readSize]; // buffer with correct data for comparison
if (verifyData) {
// initialize compare buffer
for (int j = 0; j < readSize; j++) {
compb[j] = pattern[j % pattern.length];
}
}
FSDataInputStream stm = fs.open(name);
while (bytesToRead > 0) {
// how many bytes we are reading in this iteration
int thisread = (int) Math.min(readSize, bytesToRead);
stm.readFully(b, 0, thisread);
if (verifyData) {
        // verify data read: a full chunk always starts on a pattern
        // boundary (readSize is a multiple of pattern.length), so it can
        // be compared against compb wholesale
if (thisread == readSize) {
assertTrue("file is corrupted at or after byte " +
(fileSize - bytesToRead), Arrays.equals(b, compb));
} else {
// b was only partially filled by last read
for (int k = 0; k < thisread; k++) {
assertTrue("file is corrupted at or after byte " +
(fileSize - bytesToRead), b[k] == compb[k]);
}
}
}
LOG.debug("Before update: to read: " + bytesToRead +
"; read already: "+ thisread);
bytesToRead -= thisread;
LOG.debug("After update: to read: " + bytesToRead +
"; read already: " + thisread);
}
stm.close();
}
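  /**
   * A minimal spot-check sketch (not part of the original test): rather than
   * scanning the whole file, seek to a few representative offsets and verify
   * single bytes. Assumes the hypothetical expectedByteAt helper above.
   * @param fs a reference to FileSystem
   * @param name Path of a file
   * @param fileSize size of the file
   * @throws IOException in case of errors
   */
  static void spotCheckFile(FileSystem fs, Path name, final long fileSize)
      throws IOException {
    final long[] offsets = { 0L, fileSize / 2, fileSize - 1 };
    try (FSDataInputStream stm = fs.open(name)) {
      for (long offset : offsets) {
        stm.seek(offset);
        final int read = stm.read();
        assertTrue("unexpected byte at offset " + offset,
            read == (expectedByteAt(offset) & 0xff));
      }
    }
  }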
/**
* Test for block size of 2GB + 512B. This test can take a rather long time to
* complete on Windows (reading the file back can be slow) so we use a larger
* timeout here.
* @throws IOException in case of errors
*/
@Test (timeout = 900000)
public void testLargeBlockSize() throws IOException {
final long blockSize = 2L * 1024L * 1024L * 1024L + 512L; // 2GB + 512B
runTest(blockSize);
}
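  /**
   * A hypothetical additional case (not enabled in this suite): block sizes
   * just below the 2GB boundary can be exercised the same way. Left without
   * the {@code @Test} annotation because each run adds several minutes of
   * I/O.
   * @throws IOException in case of errors
   */
  public void testLargeBlockSizeMinus512() throws IOException {
    final long blockSize = 2L * 1024L * 1024L * 1024L - 512L; // 2GB - 512B
    runTest(blockSize);
  }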
/**
* Test that we can write to and read from large blocks
* @param blockSize size of the block
* @throws IOException in case of errors
*/
public void runTest(final long blockSize) throws IOException {
// write a file that is slightly larger than 1 block
final long fileSize = blockSize + 1L;
Configuration conf = new Configuration();
MiniDFSCluster cluster = new MiniDFSCluster.Builder(conf).build();
FileSystem fs = cluster.getFileSystem();
try {
      // create a new file in the test directory
Path file1 = new Path("/tmp/TestLargeBlock", blockSize + ".dat");
FSDataOutputStream stm = createFile(fs, file1, 1, blockSize);
LOG.info("File " + file1 + " created with file size " +
fileSize +
" blocksize " + blockSize);
// verify that file exists in FS namespace
assertTrue(file1 + " should be a file",
fs.getFileStatus(file1).isFile());
// write to file
writeFile(stm, fileSize);
LOG.info("File " + file1 + " written to.");
// close file
stm.close();
LOG.info("File " + file1 + " closed.");
// Make sure a client can read it
checkFullFile(fs, file1, fileSize);
      // verify that the reported file size matches what was written
long len = fs.getFileStatus(file1).getLen();
assertTrue(file1 + " should be of size " + fileSize +
" but found to be of size " + len,
len == fileSize);
} finally {
cluster.shutdown();
}
}
}