| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.hadoop.mapreduce; |
| |
| import java.io.FileNotFoundException; |
| import java.io.IOException; |
| |
| import com.google.common.annotations.VisibleForTesting; |
| import org.apache.hadoop.fs.FileStatus; |
| import org.apache.hadoop.fs.FileSystem; |
| import org.apache.hadoop.fs.Path; |
| import org.apache.hadoop.fs.permission.FsPermission; |
| import org.apache.hadoop.security.UserGroupInformation; |
| import org.apache.hadoop.classification.InterfaceAudience; |
| import org.apache.hadoop.conf.Configuration; |
| |
| import org.apache.commons.logging.Log; |
| import org.apache.commons.logging.LogFactory; |
| |
| /** |
| * A utility to manage job submission files. |
| */ |
| @InterfaceAudience.Private |
| public class JobSubmissionFiles { |
| |
| private final static Log LOG = LogFactory.getLog(JobSubmissionFiles.class); |
| |
| // job submission directory is private! |
| final public static FsPermission JOB_DIR_PERMISSION = |
| FsPermission.createImmutable((short) 0700); // rwx------ |
| //job files are world-wide readable and owner writable |
| final public static FsPermission JOB_FILE_PERMISSION = |
| FsPermission.createImmutable((short) 0644); // rw-r--r-- |
| |
| public static Path getJobSplitFile(Path jobSubmissionDir) { |
| return new Path(jobSubmissionDir, "job.split"); |
| } |
| |
| public static Path getJobSplitMetaFile(Path jobSubmissionDir) { |
| return new Path(jobSubmissionDir, "job.splitmetainfo"); |
| } |
| |
| /** |
| * Get the job conf path. |
| */ |
| public static Path getJobConfPath(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "job.xml"); |
| } |
| |
| /** |
| * Get the job jar path. |
| */ |
| public static Path getJobJar(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "job.jar"); |
| } |
| |
| /** |
| * Get the job distributed cache files path. |
| * @param jobSubmitDir |
| */ |
| public static Path getJobDistCacheFiles(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "files"); |
| } |
| |
| /** |
| * Get the job distributed cache path for log4j properties. |
| * @param jobSubmitDir |
| */ |
| public static Path getJobLog4jFile(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "log4j"); |
| } |
| /** |
| * Get the job distributed cache archives path. |
| * @param jobSubmitDir |
| */ |
| public static Path getJobDistCacheArchives(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "archives"); |
| } |
| /** |
| * Get the job distributed cache libjars path. |
| * @param jobSubmitDir |
| */ |
| public static Path getJobDistCacheLibjars(Path jobSubmitDir) { |
| return new Path(jobSubmitDir, "libjars"); |
| } |
| |
| /** |
| * Initializes the staging directory and returns the path. It also |
| * keeps track of all necessary ownership and permissions |
| * @param cluster |
| * @param conf |
| */ |
| public static Path getStagingDir(Cluster cluster, Configuration conf) |
| throws IOException, InterruptedException { |
| UserGroupInformation user = UserGroupInformation.getLoginUser(); |
| return getStagingDir(cluster, conf, user); |
| } |
| |
| /** |
| * Initializes the staging directory and returns the path. It also |
| * keeps track of all necessary ownership and permissions. |
| * It is kept for unit testing. |
| * |
| * @param cluster Information about the map/reduce cluster |
| * @param conf Configuration object |
| * @param realUser UserGroupInformation of login user |
| * @return staging dir path object |
| * @throws IOException when ownership of staging area directory does |
| * not match the login user or current user. |
| * @throws InterruptedException when getting the staging area directory path |
| */ |
| @VisibleForTesting |
| public static Path getStagingDir(Cluster cluster, Configuration conf, |
| UserGroupInformation realUser) throws IOException, InterruptedException { |
| Path stagingArea = cluster.getStagingAreaDir(); |
| FileSystem fs = stagingArea.getFileSystem(conf); |
| UserGroupInformation currentUser = realUser.getCurrentUser(); |
| try { |
| FileStatus fsStatus = fs.getFileStatus(stagingArea); |
| String fileOwner = fsStatus.getOwner(); |
| if (!(fileOwner.equals(currentUser.getShortUserName()) || fileOwner |
| .equalsIgnoreCase(currentUser.getUserName()) || fileOwner |
| .equals(realUser.getShortUserName()) || fileOwner |
| .equalsIgnoreCase(realUser.getUserName()))) { |
| String errorMessage = "The ownership on the staging directory " + |
| stagingArea + " is not as expected. " + |
| "It is owned by " + fileOwner + ". The directory must " + |
| "be owned by the submitter " + currentUser.getShortUserName() |
| + " or " + currentUser.getUserName(); |
| if (!realUser.getUserName().equals(currentUser.getUserName())) { |
| throw new IOException( |
| errorMessage + " or " + realUser.getShortUserName() + " or " |
| + realUser.getUserName()); |
| } else { |
| throw new IOException(errorMessage); |
| } |
| } |
| if (!fsStatus.getPermission().equals(JOB_DIR_PERMISSION)) { |
| LOG.info("Permissions on staging directory " + stagingArea + " are " + |
| "incorrect: " + fsStatus.getPermission() + ". Fixing permissions " + |
| "to correct value " + JOB_DIR_PERMISSION); |
| fs.setPermission(stagingArea, JOB_DIR_PERMISSION); |
| } |
| } catch (FileNotFoundException e) { |
| fs.mkdirs(stagingArea, new FsPermission(JOB_DIR_PERMISSION)); |
| } |
| return stagingArea; |
| } |
| } |