hadoop-tools/hadoop-rumen/src/main/java/org/apache/hadoop/tools/rumen/JobHistoryUtils.java - hadoop - Git at Google

 /**
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
 package org.apache.hadoop.tools.rumen;

 import java.io.IOException;
 import java.util.HashMap;
 import java.util.Map;
 import java.util.regex.Matcher;
 import java.util.regex.Pattern;

 import org.apache.hadoop.mapreduce.JobID;
 import org.apache.hadoop.mapreduce.jobhistory.JhCounter;
 import org.apache.hadoop.mapreduce.jobhistory.JhCounterGroup;
 import org.apache.hadoop.mapreduce.jobhistory.JhCounters;
 import org.apache.hadoop.mapreduce.v2.hs.JobHistory;

 /**
  * Job History related utils for handling multiple formats of history logs of
  * different hadoop versions like Pre21 history logs, current history logs.
  */
 public class JobHistoryUtils {

   private static String applyParser(String fileName, Pattern pattern) {
     Matcher matcher = pattern.matcher(fileName);

     if (!matcher.matches()) {
       return null;
     }

     return matcher.group(1);
   }

   /**
    * Extracts jobID string from the given job history log file name or
    * job history configuration file name.
    * @param fileName name of job history file or job history configuration file
    * @return a valid jobID String, parsed out of the file name. Otherwise,
    *         [especially for .crc files] returns null.
    */
   static String extractJobID(String fileName) {
     // Get jobID if fileName is a config file name.
     String jobId = extractJobIDFromConfFileName(fileName);
     if (jobId == null) {
       // Get JobID if fileName is a job history file name
       jobId = extractJobIDFromHistoryFileName(fileName);
     }
     return jobId;
   }

   /**
    * Extracts job id from the current hadoop version's job history file name.
    * @param fileName job history file name from which job id is to be extracted
    * @return job id if the history file name format is same as that of the
    * current hadoop version. Returns null otherwise.
    */
   private static String extractJobIDFromCurrentHistoryFile(String fileName) {
     JobID id = null;
     if (org.apache.hadoop.mapreduce.v2.jobhistory.JobHistoryUtils
             .isValidJobHistoryFileName(fileName)) {
       try {
         id = org.apache.hadoop.mapreduce.v2.jobhistory.JobHistoryUtils
                  .getJobIDFromHistoryFilePath(fileName);
       } catch (IOException e) {
         // Ignore this exception and go ahead with getting of jobID assuming
         // older hadoop verison's history file
       }
     }
     if (id != null) {
       return id.toString();
     }
     return null;
   }

   /**
    * Extracts jobID string from the given job history file name.
    * @param fileName name of the job history file
    * @return JobID if the given <code>fileName</code> is a valid job history
    *         file name, <code>null</code> otherwise.
    */
   private static String extractJobIDFromHistoryFileName(String fileName) {
     // History file name could be in one of the following formats
     // (1) old pre21 job history file name format
     // (2) new pre21 job history file name format
     // (3) current job history file name format i.e. 0.22

     // Try to get the jobID assuming that the history file is from the current
     // hadoop version
     String jobID = extractJobIDFromCurrentHistoryFile(fileName);
     if (jobID != null) {
       return jobID;//history file is of current hadoop version
     }

     // History file could be of older hadoop versions
     String pre21JobID = applyParser(fileName,
         Pre21JobHistoryConstants.JOBHISTORY_FILENAME_REGEX_V1);
     if (pre21JobID == null) {
       pre21JobID = applyParser(fileName,
           Pre21JobHistoryConstants.JOBHISTORY_FILENAME_REGEX_V2);
     }
     return pre21JobID;
   }

   /**
    * Extracts jobID string from the given job conf xml file name.
    * @param fileName name of the job conf xml file
    * @return job id if the given <code>fileName</code> is a valid job conf xml
    *         file name, <code>null</code> otherwise.
    */
   private static String extractJobIDFromConfFileName(String fileName) {
     // History conf file name could be in one of the following formats
     // (1) old pre21 job history file name format
     // (2) new pre21 job history file name format
     // (3) current job history file name format i.e. 0.22
     String pre21JobID = applyParser(fileName,
                           Pre21JobHistoryConstants.CONF_FILENAME_REGEX_V1);
     if (pre21JobID == null) {
       pre21JobID = applyParser(fileName,
                      Pre21JobHistoryConstants.CONF_FILENAME_REGEX_V2);
     }
     if (pre21JobID != null) {
       return pre21JobID;
     }
     return applyParser(fileName, JobHistory.CONF_FILENAME_REGEX);
   }

   /**
    * Checks if the given <code>fileName</code> is a valid job conf xml file name
    * @param fileName name of the file to be validated
    * @return <code>true</code> if the given <code>fileName</code> is a valid
    *         job conf xml file name.
    */
   static boolean isJobConfXml(String fileName) {
     String jobId = extractJobIDFromConfFileName(fileName);
     return jobId != null;
   }

   /**
    * Extract/Add counters into the Map from the given JhCounters object.
    * @param counters the counters to be extracted from
    * @return the map of counters
    */
   static Map<String, Long> extractCounters(JhCounters counters) {
     Map<String, Long> countersMap = new HashMap<String, Long>();
     if (counters != null) {
       for (JhCounterGroup group : counters.groups) {
         for (JhCounter counter : group.counts) {
           countersMap.put(counter.name.toString(), counter.value);
         }
       }
     }
     return countersMap;
   }
 }
	/**
	* Licensed to the Apache Software Foundation (ASF) under one
	* or more contributor license agreements. See the NOTICE file
	* distributed with this work for additional information
	* regarding copyright ownership. The ASF licenses this file
	* to you under the Apache License, Version 2.0 (the
	* "License"); you may not use this file except in compliance
	* with the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/
	package org.apache.hadoop.tools.rumen;

	import java.io.IOException;
	import java.util.HashMap;
	import java.util.Map;
	import java.util.regex.Matcher;
	import java.util.regex.Pattern;

	import org.apache.hadoop.mapreduce.JobID;
	import org.apache.hadoop.mapreduce.jobhistory.JhCounter;
	import org.apache.hadoop.mapreduce.jobhistory.JhCounterGroup;
	import org.apache.hadoop.mapreduce.jobhistory.JhCounters;
	import org.apache.hadoop.mapreduce.v2.hs.JobHistory;

	/**
	* Job History related utils for handling multiple formats of history logs of
	* different hadoop versions like Pre21 history logs, current history logs.
	*/
	public class JobHistoryUtils {

	private static String applyParser(String fileName, Pattern pattern) {
	Matcher matcher = pattern.matcher(fileName);

	if (!matcher.matches()) {
	return null;
	}

	return matcher.group(1);
	}

	/**
	* Extracts jobID string from the given job history log file name or
	* job history configuration file name.
	* @param fileName name of job history file or job history configuration file
	* @return a valid jobID String, parsed out of the file name. Otherwise,
	* [especially for .crc files] returns null.
	*/
	static String extractJobID(String fileName) {
	// Get jobID if fileName is a config file name.
	String jobId = extractJobIDFromConfFileName(fileName);
	if (jobId == null) {
	// Get JobID if fileName is a job history file name
	jobId = extractJobIDFromHistoryFileName(fileName);
	}
	return jobId;
	}

	/**
	* Extracts job id from the current hadoop version's job history file name.
	* @param fileName job history file name from which job id is to be extracted
	* @return job id if the history file name format is same as that of the
	* current hadoop version. Returns null otherwise.
	*/
	private static String extractJobIDFromCurrentHistoryFile(String fileName) {
	JobID id = null;
	if (org.apache.hadoop.mapreduce.v2.jobhistory.JobHistoryUtils
	.isValidJobHistoryFileName(fileName)) {
	try {
	id = org.apache.hadoop.mapreduce.v2.jobhistory.JobHistoryUtils
	.getJobIDFromHistoryFilePath(fileName);
	} catch (IOException e) {
	// Ignore this exception and go ahead with getting of jobID assuming
	// older hadoop verison's history file
	}
	}
	if (id != null) {
	return id.toString();
	}
	return null;
	}

	/**
	* Extracts jobID string from the given job history file name.
	* @param fileName name of the job history file
	* @return JobID if the given <code>fileName</code> is a valid job history
	* file name, <code>null</code> otherwise.
	*/
	private static String extractJobIDFromHistoryFileName(String fileName) {
	// History file name could be in one of the following formats
	// (1) old pre21 job history file name format
	// (2) new pre21 job history file name format
	// (3) current job history file name format i.e. 0.22

	// Try to get the jobID assuming that the history file is from the current
	// hadoop version
	String jobID = extractJobIDFromCurrentHistoryFile(fileName);
	if (jobID != null) {
	return jobID;//history file is of current hadoop version
	}

	// History file could be of older hadoop versions
	String pre21JobID = applyParser(fileName,
	Pre21JobHistoryConstants.JOBHISTORY_FILENAME_REGEX_V1);
	if (pre21JobID == null) {
	pre21JobID = applyParser(fileName,
	Pre21JobHistoryConstants.JOBHISTORY_FILENAME_REGEX_V2);
	}
	return pre21JobID;
	}

	/**
	* Extracts jobID string from the given job conf xml file name.
	* @param fileName name of the job conf xml file
	* @return job id if the given <code>fileName</code> is a valid job conf xml
	* file name, <code>null</code> otherwise.
	*/
	private static String extractJobIDFromConfFileName(String fileName) {
	// History conf file name could be in one of the following formats
	// (1) old pre21 job history file name format
	// (2) new pre21 job history file name format
	// (3) current job history file name format i.e. 0.22
	String pre21JobID = applyParser(fileName,
	Pre21JobHistoryConstants.CONF_FILENAME_REGEX_V1);
	if (pre21JobID == null) {
	pre21JobID = applyParser(fileName,
	Pre21JobHistoryConstants.CONF_FILENAME_REGEX_V2);
	}
	if (pre21JobID != null) {
	return pre21JobID;
	}
	return applyParser(fileName, JobHistory.CONF_FILENAME_REGEX);
	}

	/**
	* Checks if the given <code>fileName</code> is a valid job conf xml file name
	* @param fileName name of the file to be validated
	* @return <code>true</code> if the given <code>fileName</code> is a valid
	* job conf xml file name.
	*/
	static boolean isJobConfXml(String fileName) {
	String jobId = extractJobIDFromConfFileName(fileName);
	return jobId != null;
	}

	/**
	* Extract/Add counters into the Map from the given JhCounters object.
	* @param counters the counters to be extracted from
	* @return the map of counters
	*/
	static Map<String, Long> extractCounters(JhCounters counters) {
	Map<String, Long> countersMap = new HashMap<String, Long>();
	if (counters != null) {
	for (JhCounterGroup group : counters.groups) {
	for (JhCounter counter : group.counts) {
	countersMap.put(counter.name.toString(), counter.value);
	}
	}
	}
	return countersMap;
	}
	}