blob: d09531879e1350a02eee4158f992fcc6d0ef2c9b [file] [log] [blame]
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
import java.util.EnumSet;
import java.util.List;
import java.util.Map;
import java.util.concurrent.ConcurrentMap;
import org.apache.drill.exec.ops.OperatorStats;
import org.apache.drill.exec.util.AssertionUtil;
import org.apache.hadoop.classification.InterfaceAudience.LimitedPrivate;
import org.apache.hadoop.classification.InterfaceAudience.Private;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.BlockLocation;
import org.apache.hadoop.fs.ContentSummary;
import org.apache.hadoop.fs.CreateFlag;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileChecksum;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.FsServerDefaults;
import org.apache.hadoop.fs.FsStatus;
import org.apache.hadoop.fs.LocatedFileStatus;
import org.apache.hadoop.fs.Options.ChecksumOpt;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.PathFilter;
import org.apache.hadoop.fs.RemoteIterator;
import org.apache.hadoop.fs.XAttrSetFlag;
import org.apache.hadoop.fs.permission.AclEntry;
import org.apache.hadoop.fs.permission.AclStatus;
import org.apache.hadoop.fs.permission.FsAction;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.util.Progressable;
/**
 * DrillFileSystem is the wrapper around the actual FileSystem implementation. The {@link DrillFileSystem} is
 * immutable.
 *
 * If {@link org.apache.drill.exec.ops.OperatorStats} are provided it returns an instrumented FSDataInputStream to
 * measure IO wait time and to track file open/close operations.
 */
public class DrillFileSystem extends FileSystem implements OpenFileTracker {
  static final org.slf4j.Logger logger = org.slf4j.LoggerFactory.getLogger(DrillFileSystem.class);

  /** Mirrors whether JVM assertions are enabled, as reported by {@link AssertionUtil#isAssertionsEnabled()}. */
  private static final boolean TRACKING_ENABLED = AssertionUtil.isAssertionsEnabled();

  // NOTE(review): presumably name prefixes of files that readers should skip — confirm against callers.
  public static final String UNDERSCORE_PREFIX = "_";
  public static final String DOT_PREFIX = ".";

  /** Streams registered through fileOpened(), each mapped to the stack trace captured when it was opened. */
  private final ConcurrentMap<DrillFSDataInputStream, DebugStackTrace> openedFiles = Maps.newConcurrentMap();

  /** The file system every operation is forwarded to. */
  private final FileSystem underlyingFs;

  /** Optional operator statistics; may be {@code null} (the single-argument constructor passes null). */
  private final OperatorStats operatorStats;

  /** Used to look up a compression codec for a path. */
  private final CompressionCodecFactory codecFactory;
/**
 * Creates a file system wrapper without operator statistics.
 *
 * @param fsConf configuration used to obtain the wrapped file system
 * @throws IOException if the two-argument constructor fails
 */
public DrillFileSystem(Configuration fsConf) throws IOException {
  this(fsConf, null);
}
public DrillFileSystem(Configuration fsConf, OperatorStats operatorStats) throws IOException {
// Configuration objects are mutable, and the underlying FileSystem object may directly use a passed in Configuration.
// In order to avoid scenarios where a Configuration can change after a DrillFileSystem is created, we make a copy
// of the Configuration.
fsConf = new Configuration(fsConf);
this.underlyingFs = FileSystem.get(fsConf);
this.codecFactory = new CompressionCodecFactory(fsConf);
this.operatorStats = operatorStats;
private void throwUnsupported() {
throw new UnsupportedOperationException(DrillFileSystem.class.getCanonicalName() + " is immutable and should not be changed after creation.");
* This method should never be used on {@link DrillFileSystem} since {@link DrillFileSystem} is immutable.
* {@inheritDoc}
* @throws UnsupportedOperationException when called.
public void setConf(Configuration conf) {
if (underlyingFs != null) {
// The parent class's constructor FileSystem() calls Configured(null) which calls setConf(null).
// We want to let that first call to setConf succeed. Any subsequent calls would be made by a user and are not allowed.
* Returns a copy of {@link Configuration} for this {@link DrillFileSystem}.
* <b>Note: </b> a copy of the {@link Configuration} is returned in order to enforce immutability.
* @return A copy of {@link Configuration} for this {@link DrillFileSystem}.
public Configuration getConf() {
return new Configuration(this.underlyingFs.getConf());
* If OperatorStats are provided return a instrumented {@link org.apache.hadoop.fs.FSDataInputStream}.
public FSDataInputStream open(Path f, int bufferSize) throws IOException {
if (operatorStats == null) {
return, bufferSize);
DrillFSDataInputStream is = new DrillFSDataInputStream(, bufferSize), operatorStats, this);
fileOpened(f, is);
return is;
return new DrillFSDataInputStream(, bufferSize), operatorStats);
* If OperatorStats are provided return a instrumented {@link org.apache.hadoop.fs.FSDataInputStream}.
public FSDataInputStream open(Path f) throws IOException {
if (operatorStats == null) {
DrillFSDataInputStream is = new DrillFSDataInputStream(, operatorStats, this);
fileOpened(f, is);
return is;
return new DrillFSDataInputStream(, operatorStats);
* This method should never be used on {@link DrillFileSystem} since {@link DrillFileSystem} is immutable.
* {@inheritDoc}
* @throws UnsupportedOperationException when called.
public void initialize(URI name, Configuration conf) {
public String getScheme() {
return underlyingFs.getScheme();
public FSDataOutputStream create(Path f) throws IOException {
return underlyingFs.create(f);
public FSDataOutputStream create(Path f, boolean overwrite) throws IOException {
return underlyingFs.create(f, overwrite);
public FSDataOutputStream create(Path f, Progressable progress) throws IOException {
return underlyingFs.create(f, progress);
public FSDataOutputStream create(Path f, short replication) throws IOException {
return underlyingFs.create(f, replication);
public FSDataOutputStream create(Path f, short replication, Progressable progress) throws IOException {
return underlyingFs.create(f, replication, progress);
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize) throws IOException {
return underlyingFs.create(f, overwrite, bufferSize);
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, Progressable progress) throws IOException {
return underlyingFs.create(f, overwrite, bufferSize, progress);
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, short replication,
long blockSize) throws IOException {
return underlyingFs.create(f, overwrite, bufferSize, replication, blockSize);
public FSDataOutputStream create(Path f, boolean overwrite, int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
return underlyingFs.create(f, overwrite, bufferSize, replication, blockSize, progress);
public FileStatus getFileStatus(Path f) throws IOException {
return underlyingFs.getFileStatus(f);
public void createSymlink(Path target, Path link, boolean createParent) throws IOException {
underlyingFs.createSymlink(target, link, createParent);
public FileStatus getFileLinkStatus(Path f) throws IOException {
return underlyingFs.getFileLinkStatus(f);
public boolean supportsSymlinks() {
return underlyingFs.supportsSymlinks();
public Path getLinkTarget(Path f) throws IOException {
return underlyingFs.getLinkTarget(f);
public FileChecksum getFileChecksum(Path f) throws IOException {
return underlyingFs.getFileChecksum(f);
* This method should never be used on {@link DrillFileSystem} since {@link DrillFileSystem} is immutable.
* {@inheritDoc}
* @throws UnsupportedOperationException when called.
public void setVerifyChecksum(boolean verifyChecksum) {
* This method should never be used on {@link DrillFileSystem} since {@link DrillFileSystem} is immutable.
* {@inheritDoc}
* @throws UnsupportedOperationException when called.
public void setWriteChecksum(boolean writeChecksum) {
public FsStatus getStatus() throws IOException {
return underlyingFs.getStatus();
public FsStatus getStatus(Path p) throws IOException {
return underlyingFs.getStatus(p);
public void setPermission(Path p, FsPermission permission) throws IOException {
underlyingFs.setPermission(p, permission);
public void setOwner(Path p, String username, String groupname) throws IOException {
underlyingFs.setOwner(p, username, groupname);
public void setTimes(Path p, long mtime, long atime) throws IOException {
underlyingFs.setTimes(p, mtime, atime);
public Path createSnapshot(Path path, String snapshotName) throws IOException {
return underlyingFs.createSnapshot(path, snapshotName);
public void renameSnapshot(Path path, String snapshotOldName, String snapshotNewName) throws IOException {
underlyingFs.renameSnapshot(path, snapshotOldName, snapshotNewName);
public void deleteSnapshot(Path path, String snapshotName) throws IOException {
underlyingFs.deleteSnapshot(path, snapshotName);
public void modifyAclEntries(Path path, List<AclEntry> aclSpec) throws IOException {
underlyingFs.modifyAclEntries(path, aclSpec);
public void removeAclEntries(Path path, List<AclEntry> aclSpec) throws IOException {
underlyingFs.removeAclEntries(path, aclSpec);
public void removeDefaultAcl(Path path) throws IOException {
public void removeAcl(Path path) throws IOException {
public void setAcl(Path path, List<AclEntry> aclSpec) throws IOException {
underlyingFs.setAcl(path, aclSpec);
public AclStatus getAclStatus(Path path) throws IOException {
return underlyingFs.getAclStatus(path);
public Path getWorkingDirectory() {
return underlyingFs.getWorkingDirectory();
public FSDataOutputStream append(Path f, int bufferSize, Progressable progress) throws IOException {
return underlyingFs.append(f, bufferSize, progress);
public void concat(Path trg, Path[] psrcs) throws IOException {
underlyingFs.concat(trg, psrcs);
public short getReplication(Path src) throws IOException {
return underlyingFs.getReplication(src);
public boolean setReplication(Path src, short replication) throws IOException {
return underlyingFs.setReplication(src, replication);
public boolean mkdirs(Path f, FsPermission permission) throws IOException {
return underlyingFs.mkdirs(f, permission);
public void copyFromLocalFile(Path src, Path dst) throws IOException {
underlyingFs.copyFromLocalFile(src, dst);
public void moveFromLocalFile(Path[] srcs, Path dst) throws IOException {
underlyingFs.moveFromLocalFile(srcs, dst);
public void moveFromLocalFile(Path src, Path dst) throws IOException {
underlyingFs.moveFromLocalFile(src, dst);
public void copyFromLocalFile(boolean delSrc, Path src, Path dst) throws IOException {
underlyingFs.copyFromLocalFile(delSrc, src, dst);
public void copyFromLocalFile(boolean delSrc, boolean overwrite, Path[] srcs, Path dst) throws IOException {
underlyingFs.copyFromLocalFile(delSrc, overwrite, srcs, dst);
public void copyFromLocalFile(boolean delSrc, boolean overwrite, Path src, Path dst) throws IOException {
underlyingFs.copyFromLocalFile(delSrc, overwrite, src, dst);
public void copyToLocalFile(Path src, Path dst) throws IOException {
underlyingFs.copyToLocalFile(src, dst);
public void moveToLocalFile(Path src, Path dst) throws IOException {
underlyingFs.moveToLocalFile(src, dst);
public void copyToLocalFile(boolean delSrc, Path src, Path dst) throws IOException {
underlyingFs.copyToLocalFile(delSrc, src, dst);
public void copyToLocalFile(boolean delSrc, Path src, Path dst, boolean useRawLocalFileSystem) throws IOException {
underlyingFs.copyToLocalFile(delSrc, src, dst, useRawLocalFileSystem);
public Path startLocalOutput(Path fsOutputFile, Path tmpLocalFile) throws IOException {
return underlyingFs.startLocalOutput(fsOutputFile, tmpLocalFile);
public void completeLocalOutput(Path fsOutputFile, Path tmpLocalFile) throws IOException {
underlyingFs.completeLocalOutput(fsOutputFile, tmpLocalFile);
public void close() throws IOException {
if (openedFiles.size() != 0) {
final StringBuffer errMsgBuilder = new StringBuffer();
errMsgBuilder.append(String.format("Not all files opened using this FileSystem are closed. " + "There are" +
" still [%d] files open.\n", openedFiles.size()));
for (DebugStackTrace stackTrace : openedFiles.values()) {
final String errMsg = errMsgBuilder.toString();
throw new IllegalStateException(errMsg);
public long getUsed() throws IOException {
return underlyingFs.getUsed();
public long getBlockSize(Path f) throws IOException {
return underlyingFs.getBlockSize(f);
public long getDefaultBlockSize() {
return underlyingFs.getDefaultBlockSize();
public long getDefaultBlockSize(Path f) {
return underlyingFs.getDefaultBlockSize(f);
public short getDefaultReplication() {
return underlyingFs.getDefaultReplication();
public short getDefaultReplication(Path path) {
return underlyingFs.getDefaultReplication(path);
public boolean mkdirs(Path folderPath) throws IOException {
if (!underlyingFs.exists(folderPath)) {
return underlyingFs.mkdirs(folderPath);
} else if (!underlyingFs.getFileStatus(folderPath).isDir()) {
throw new IOException("The specified folder path exists and is not a folder.");
return false;
public FSDataOutputStream create(Path f, FsPermission permission, EnumSet<CreateFlag> flags, int bufferSize,
short replication, long blockSize, Progressable progress, ChecksumOpt checksumOpt) throws IOException {
return underlyingFs.create(f, permission, flags, bufferSize, replication, blockSize, progress, checksumOpt);
public FSDataOutputStream createNonRecursive(Path f, boolean overwrite, int bufferSize, short replication,
long blockSize, Progressable progress) throws IOException {
return underlyingFs.createNonRecursive(f, overwrite, bufferSize, replication, blockSize, progress);
public FSDataOutputStream createNonRecursive(Path f, FsPermission permission, boolean overwrite, int bufferSize,
short replication, long blockSize, Progressable progress) throws IOException {
return underlyingFs.createNonRecursive(f, permission, overwrite, bufferSize, replication, blockSize, progress);
public FSDataOutputStream createNonRecursive(Path f, FsPermission permission, EnumSet<CreateFlag> flags, int bufferSize, short replication, long blockSize, Progressable progress) throws IOException {
return underlyingFs.createNonRecursive(f, permission, flags, bufferSize, replication, blockSize, progress);
public boolean createNewFile(Path f) throws IOException {
return underlyingFs.createNewFile(f);
public FSDataOutputStream append(Path f) throws IOException {
return underlyingFs.append(f);
public FSDataOutputStream append(Path f, int bufferSize) throws IOException {
return underlyingFs.append(f, bufferSize);
public FSDataOutputStream create(Path f, FsPermission permission, boolean overwrite, int bufferSize, short
replication, long blockSize, Progressable progress) throws IOException {
return underlyingFs.create(f, permission, overwrite, bufferSize, replication, blockSize, progress);
public FSDataOutputStream create(Path f, FsPermission permission, EnumSet<CreateFlag> flags, int bufferSize,
short replication, long blockSize, Progressable progress) throws IOException {
return underlyingFs.create(f, permission, flags, bufferSize, replication, blockSize, progress);
public FileStatus[] listStatus(Path f) throws FileNotFoundException, IOException {
return underlyingFs.listStatus(f);
public RemoteIterator<Path> listCorruptFileBlocks(Path path) throws IOException {
return underlyingFs.listCorruptFileBlocks(path);
public FileStatus[] listStatus(Path f, PathFilter filter) throws FileNotFoundException, IOException {
return underlyingFs.listStatus(f, filter);
public FileStatus[] listStatus(Path[] files) throws FileNotFoundException, IOException {
return underlyingFs.listStatus(files);
public FileStatus[] listStatus(Path[] files, PathFilter filter) throws FileNotFoundException, IOException {
return underlyingFs.listStatus(files, filter);
public FileStatus[] globStatus(Path pathPattern) throws IOException {
return underlyingFs.globStatus(pathPattern);
public FileStatus[] globStatus(Path pathPattern, PathFilter filter) throws IOException {
return underlyingFs.globStatus(pathPattern, filter);
public RemoteIterator<LocatedFileStatus> listLocatedStatus(Path f) throws FileNotFoundException, IOException {
return underlyingFs.listLocatedStatus(f);
public RemoteIterator<LocatedFileStatus> listFiles(Path f, boolean recursive) throws FileNotFoundException, IOException {
return underlyingFs.listFiles(f, recursive);
public Path getHomeDirectory() {
return underlyingFs.getHomeDirectory();
* This method should never be used on {@link DrillFileSystem} since {@link DrillFileSystem} is immutable.
* {@inheritDoc}
* @throws UnsupportedOperationException when called.
public void setWorkingDirectory(Path new_dir) {
public boolean rename(Path src, Path dst) throws IOException {
return underlyingFs.rename(src, dst);
public boolean delete(Path f) throws IOException {
return underlyingFs.delete(f);
public boolean delete(Path f, boolean recursive) throws IOException {
return underlyingFs.delete(f, recursive);
public boolean deleteOnExit(Path f) throws IOException {
return underlyingFs.deleteOnExit(f);
public boolean cancelDeleteOnExit(Path f) {
return underlyingFs.cancelDeleteOnExit(f);
public boolean exists(Path f) throws IOException {
return underlyingFs.exists(f);
public boolean isDirectory(Path f) throws IOException {
return underlyingFs.isDirectory(f);
public boolean isFile(Path f) throws IOException {
return underlyingFs.isFile(f);
public long getLength(Path f) throws IOException {
return underlyingFs.getLength(f);
public ContentSummary getContentSummary(Path f) throws IOException {
return underlyingFs.getContentSummary(f);
public URI getUri() {
return underlyingFs.getUri();
@LimitedPrivate({"HDFS", "MapReduce"})
public String getCanonicalServiceName() {
return underlyingFs.getCanonicalServiceName();
public String getName() {
return underlyingFs.getName();
public Path makeQualified(Path path) {
return underlyingFs.makeQualified(path);
public Token<?> getDelegationToken(String renewer) throws IOException {
return underlyingFs.getDelegationToken(renewer);
@LimitedPrivate({"HDFS", "MapReduce"})
public Token<?>[] addDelegationTokens(String renewer, Credentials credentials) throws IOException {
return underlyingFs.addDelegationTokens(renewer, credentials);
public FileSystem[] getChildFileSystems() {
return underlyingFs.getChildFileSystems();
public BlockLocation[] getFileBlockLocations(FileStatus file, long start, long len) throws IOException {
return underlyingFs.getFileBlockLocations(file, start, len);
public BlockLocation[] getFileBlockLocations(Path p, long start, long len) throws IOException {
return underlyingFs.getFileBlockLocations(p, start, len);
public FsServerDefaults getServerDefaults() throws IOException {
return underlyingFs.getServerDefaults();
public FsServerDefaults getServerDefaults(Path p) throws IOException {
return underlyingFs.getServerDefaults(p);
public Path resolvePath(Path p) throws IOException {
return underlyingFs.resolvePath(p);
public boolean truncate(final Path f, final long newLength) throws IOException {
return underlyingFs.truncate(f, newLength);
public RemoteIterator<FileStatus> listStatusIterator(final Path p) throws FileNotFoundException, IOException {
return underlyingFs.listStatusIterator(p);
public void access(final Path path, final FsAction mode) throws AccessControlException, FileNotFoundException, IOException {
underlyingFs.access(path, mode);
public FileChecksum getFileChecksum(final Path f, final long length) throws IOException {
return underlyingFs.getFileChecksum(f, length);
public void setXAttr(final Path path, final String name, final byte[] value) throws IOException {
underlyingFs.setXAttr(path, name, value);
public void setXAttr(final Path path, final String name, final byte[] value, final EnumSet<XAttrSetFlag> flag) throws IOException {
underlyingFs.setXAttr(path, name, value, flag);
public byte[] getXAttr(final Path path, final String name) throws IOException {
return underlyingFs.getXAttr(path, name);
public Map<String, byte[]> getXAttrs(final Path path) throws IOException {
return underlyingFs.getXAttrs(path);
public Map<String, byte[]> getXAttrs(final Path path, final List<String> names) throws IOException {
return underlyingFs.getXAttrs(path, names);
public List<String> listXAttrs(final Path path) throws IOException {
return underlyingFs.listXAttrs(path);
public void removeXAttr(final Path path, final String name) throws IOException {
underlyingFs.removeXAttr(path, name);
public InputStream openPossiblyCompressedStream(Path path) throws IOException {
CompressionCodec codec = codecFactory.getCodec(path); // infers from file ext.
if (codec != null) {
return codec.createInputStream(open(path));
} else {
return open(path);
public void fileOpened(Path path, DrillFSDataInputStream fsDataInputStream) {
openedFiles.put(fsDataInputStream, new DebugStackTrace(path, Thread.currentThread().getStackTrace()));
public void fileClosed(DrillFSDataInputStream fsDataInputStream) {
public static class DebugStackTrace {
  /** Stack frames handed to the constructor. */
  private final StackTraceElement[] elements;

  /** Path handed to the constructor. */
  private final Path path;
/**
 * Stores a path together with a stack trace.
 *
 * @param path the path to record
 * @param elements the stack frames to record; the array is stored as-is, not copied
 */
public DebugStackTrace(Path path, StackTraceElement[] elements) {
  this.elements = elements;
  this.path = path;
}
public void addToStringBuilder(StringBuffer sb) {
sb.append("File '");
sb.append("' opened at callstack:\n");
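// Add all stack elements except the top three: they belong to the stack capture and the file-open bookkeeping
// (Thread.getStackTrace(), fileOpened(), open()) rather than to the code that opened the file.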
for (int i = 3; i < elements.length; i++) {