blob: e933d108d2580c741f44336abd37bc528dfd1fce [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.mapreduce.server.tasktracker;
import java.io.File;
import java.io.IOException;
import java.util.HashMap;
import java.util.Map;
import java.util.concurrent.atomic.AtomicBoolean;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.classification.InterfaceAudience;
import org.apache.hadoop.classification.InterfaceStability;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.FileUtil;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.permission.FsPermission;
import org.apache.hadoop.mapred.TaskController;
import org.apache.hadoop.mapred.TaskLog;
import org.apache.hadoop.mapred.TaskTracker;
import org.apache.hadoop.mapred.TaskController.InitializationContext;
import org.apache.hadoop.mapreduce.JobID;
@InterfaceAudience.Private
@InterfaceStability.Unstable
public class Localizer {
static final Log LOG = LogFactory.getLog(Localizer.class);
private FileSystem fs;
private String[] localDirs;
private TaskController taskController;
/**
* Create a Localizer instance
*
* @param fileSys
* @param lDirs
* @param tc
*/
public Localizer(FileSystem fileSys, String[] lDirs, TaskController tc) {
fs = fileSys;
localDirs = lDirs;
taskController = tc;
}
// Data-structure for synchronizing localization of user directories.
private Map<String, AtomicBoolean> localizedUsers =
new HashMap<String, AtomicBoolean>();
/**
* Initialize the local directories for a particular user on this TT. This
* involves creation and setting permissions of the following directories
* <ul>
* <li>$mapreduce.cluster.local.dir/taskTracker/$user</li>
* <li>$mapreduce.cluster.local.dir/taskTracker/$user/jobcache</li>
* <li>$mapreduce.cluster.local.dir/taskTracker/$user/distcache</li>
* </ul>
*
* @param user
* @throws IOException
*/
public void initializeUserDirs(String user)
throws IOException {
if (user == null) {
// This shouldn't happen in general
throw new IOException(
"User is null. Cannot initialized user-directories.");
}
AtomicBoolean localizedUser;
synchronized (localizedUsers) {
if (!localizedUsers.containsKey(user)) {
localizedUsers.put(user, new AtomicBoolean(false));
}
localizedUser = localizedUsers.get(user);
}
synchronized (localizedUser) {
if (localizedUser.get()) {
// User-directories are already localized for this user.
LOG.info("User-directories for the user " + user
+ " are already initialized on this TT. Not doing anything.");
return;
}
LOG.info("Initializing user " + user + " on this TT.");
boolean userDirStatus = false;
boolean jobCacheDirStatus = false;
boolean distributedCacheDirStatus = false;
for (String localDir : localDirs) {
Path userDir = new Path(localDir, TaskTracker.getUserDir(user));
// Set up the user-directory.
if (fs.exists(userDir) || fs.mkdirs(userDir)) {
// Set permissions on the user-directory
fs.setPermission(userDir, new FsPermission((short)0700));
userDirStatus = true;
// Set up the jobcache directory
Path jobCacheDir =
new Path(localDir, TaskTracker.getJobCacheSubdir(user));
if (fs.exists(jobCacheDir) || fs.mkdirs(jobCacheDir)) {
// Set permissions on the jobcache-directory
fs.setPermission(jobCacheDir, new FsPermission((short)0700));
jobCacheDirStatus = true;
} else {
LOG.warn("Unable to create job cache directory : "
+ jobCacheDir);
}
// Set up the cache directory used for distributed cache files
Path distributedCacheDir =
new Path(localDir, TaskTracker.getPrivateDistributedCacheDir(user));
if (fs.exists(distributedCacheDir) || fs.mkdirs(distributedCacheDir)) {
// Set permissions on the distcache-directory
fs.setPermission(distributedCacheDir, new FsPermission((short)0700));
distributedCacheDirStatus = true;
} else {
LOG.warn("Unable to create distributed-cache directory : "
+ distributedCacheDir);
}
} else {
LOG.warn("Unable to create the user directory : " + userDir);
}
}
if (!userDirStatus) {
throw new IOException("Not able to initialize user directories "
+ "in any of the configured local directories for user " + user);
}
if (!jobCacheDirStatus) {
throw new IOException("Not able to initialize job-cache directories "
+ "in any of the configured local directories for user " + user);
}
if (!distributedCacheDirStatus) {
throw new IOException(
"Not able to initialize distributed-cache directories "
+ "in any of the configured local directories for user "
+ user);
}
// Now, run the task-controller specific code to initialize the
// user-directories.
InitializationContext context = new InitializationContext();
context.user = user;
context.workDir = null;
taskController.initializeUser(context);
// Localization of the user is done
localizedUser.set(true);
}
}
/**
* Prepare the job directories for a given job. To be called by the job
* localization code, only if the job is not already localized.
*
* <br>
* Here, we set 700 permissions on the job directories created on all disks.
* This we do so as to avoid any misuse by other users till the time
* {@link TaskController#initializeJob(JobInitializationContext)} is run at a
* later time to set proper private permissions on the job directories. <br>
*
* @param user
* @param jobId
* @throws IOException
*/
public void initializeJobDirs(String user, JobID jobId)
throws IOException {
boolean initJobDirStatus = false;
String jobDirPath = TaskTracker.getLocalJobDir(user, jobId.toString());
for (String localDir : localDirs) {
Path jobDir = new Path(localDir, jobDirPath);
if (fs.exists(jobDir)) {
// this will happen on a partial execution of localizeJob. Sometimes
// copying job.xml to the local disk succeeds but copying job.jar might
// throw out an exception. We should clean up and then try again.
fs.delete(jobDir, true);
}
boolean jobDirStatus = fs.mkdirs(jobDir);
if (!jobDirStatus) {
LOG.warn("Not able to create job directory " + jobDir.toString());
}
initJobDirStatus = initJobDirStatus || jobDirStatus;
// job-dir has to be private to the TT
fs.setPermission(jobDir, new FsPermission((short)0700));
}
if (!initJobDirStatus) {
throw new IOException("Not able to initialize job directories "
+ "in any of the configured local directories for job "
+ jobId.toString());
}
}
/**
* Create taskDirs on all the disks. Otherwise, in some cases, like when
* LinuxTaskController is in use, child might wish to balance load across
* disks but cannot itself create attempt directory because of the fact that
* job directory is writable only by the TT.
*
* @param user
* @param jobId
* @param attemptId
* @param isCleanupAttempt
* @throws IOException
*/
public void initializeAttemptDirs(String user, String jobId,
String attemptId, boolean isCleanupAttempt)
throws IOException {
boolean initStatus = false;
String attemptDirPath =
TaskTracker.getLocalTaskDir(user, jobId, attemptId, isCleanupAttempt);
for (String localDir : localDirs) {
Path localAttemptDir = new Path(localDir, attemptDirPath);
boolean attemptDirStatus = fs.mkdirs(localAttemptDir);
if (!attemptDirStatus) {
LOG.warn("localAttemptDir " + localAttemptDir.toString()
+ " couldn't be created.");
}
initStatus = initStatus || attemptDirStatus;
}
if (!initStatus) {
throw new IOException("Not able to initialize attempt directories "
+ "in any of the configured local directories for the attempt "
+ attemptId);
}
}
/**
* Create job log directory and set appropriate permissions for the directory.
*
* @param jobId
*/
public void initializeJobLogDir(JobID jobId) throws IOException {
Path jobUserLogDir = new Path(TaskLog.getJobDir(jobId).getCanonicalPath());
if (!fs.mkdirs(jobUserLogDir)) {
throw new IOException("Could not create job user log directory: " +
jobUserLogDir);
}
fs.setPermission(jobUserLogDir, new FsPermission((short)0700));
}
}