blob: 90d28259f5b1628bf8374b77535b1d81f9b98d66 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tez.mapreduce.examples;
import java.io.IOException;
import java.text.DecimalFormat;
import java.util.EnumSet;
import java.util.Set;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.util.ProgramDriver;
import org.apache.tez.common.counters.TezCounters;
import org.apache.tez.dag.api.TezException;
import org.apache.tez.dag.api.client.DAGClient;
import org.apache.tez.dag.api.client.DAGStatus;
import org.apache.tez.dag.api.client.Progress;
import org.apache.tez.dag.api.client.StatusGetOpts;
import org.apache.tez.dag.api.client.VertexStatus;
import org.apache.tez.mapreduce.hadoop.MRConfig;
/**
 * Command-line driver for the Tez MapReduce example programs.
 *
 * <p>{@link #main(String[])} registers each example under a short name with a
 * Hadoop {@link ProgramDriver} and hands the command-line arguments to it. The
 * class also exposes small static helpers used by the examples: one builds a
 * {@link Configuration} with the framework name set to Tez, the others print
 * DAG and per-vertex progress (and optionally counters) to standard output.
 */
public class ExampleDriver {

  /** {@link DecimalFormat} pattern used to render a progress fraction as a percentage. */
  private static final String PROGRESS_PATTERN = "###.##%";

  /**
   * Registers the example programs and runs the one selected by {@code argv}.
   *
   * <p>The JVM always exits from this method. The exit status is the value
   * returned by {@link ProgramDriver#run(String[])}, or {@code -1} if
   * registration or the run itself throws.
   *
   * @param argv command-line arguments, passed unchanged to the program driver
   */
  public static void main(String[] argv) {
    int exitCode = -1;
    ProgramDriver pgd = new ProgramDriver();
    try {
      pgd.addClass("broadcastloadgen", BroadcastLoadGen.class,
          "Run a DAG to generate load for Broadcast Shuffle");
      pgd.addClass("rpcloadgen", RPCLoadGen.class,
          "Run a DAG to generate load for the task to AM RPC");
      pgd.addClass("wordcount", MapredWordCount.class,
          "A map/reduce program that counts the words in the input files.");
      pgd.addClass("mapredwordcount", MapredWordCount.class,
          "A map/reduce program that counts the words in the input files"
          + " using the mapred apis.");
      pgd.addClass("randomwriter", RandomWriter.class,
          "A map/reduce program that writes 10GB of random data per node.");
      pgd.addClass("randomtextwriter", RandomTextWriter.class,
          "A map/reduce program that writes 10GB of random textual data per node.");
      pgd.addClass("sort", Sort.class,
          "A map/reduce program that sorts the data written by the random"
          + " writer.");
      pgd.addClass("secondarysort", SecondarySort.class,
          "An example defining a secondary sort to the reduce.");
      pgd.addClass("join", Join.class,
          "A job that effects a join over sorted, equally partitioned"
          + " datasets");
      pgd.addClass("mrrsleep", MRRSleepJob.class,
          "MRR Sleep Job");
      pgd.addClass("testorderedwordcount", TestOrderedWordCount.class,
          "Word Count with words sorted on frequency");
      pgd.addClass("unionexample", UnionExample.class,
          "Union example");
      pgd.addClass("broadcastAndOneToOneExample", BroadcastAndOneToOneExample.class,
          "BroadcastAndOneToOneExample example");
      pgd.addClass("filterLinesByWord", FilterLinesByWord.class,
          "Filters lines by the specified word using broadcast edge");
      pgd.addClass("filterLinesByWordOneToOne", FilterLinesByWordOneToOne.class,
          "Filters lines by the specified word using OneToOne edge");
      pgd.addClass("multiplecommitsExample", MultipleCommitsExample.class,
          "Job with multiple commits in both vertex group and vertex");
      exitCode = pgd.run(argv);
    } catch (Throwable e) {
      // Top-level boundary of a CLI tool: report the failure and fall through
      // to exit with the default failure status (-1).
      e.printStackTrace();
    }
    System.exit(exitCode);
  }

  /**
   * Creates a new {@link Configuration} whose {@link MRConfig#FRAMEWORK_NAME}
   * is set to {@link MRConfig#YARN_TEZ_FRAMEWORK_NAME}.
   *
   * @return a freshly constructed configuration with the framework name set
   */
  public static Configuration getTezDecoratedConfiguration() {
    Configuration configuration = new Configuration();
    configuration.set(MRConfig.FRAMEWORK_NAME, MRConfig.YARN_TEZ_FRAMEWORK_NAME);
    return configuration;
  }

  /**
   * Prints DAG and vertex progress without any counters.
   *
   * <p>Equivalent to
   * {@link #printDAGStatus(DAGClient, String[], boolean, boolean)} with both
   * counter flags set to {@code false}.
   *
   * @param dagClient client used to query the DAG and its vertices
   * @param vertexNames names of the vertices whose progress should be printed
   * @throws IOException if a status query throws it
   * @throws TezException if a status query throws it
   */
  public static void printDAGStatus(DAGClient dagClient, String[] vertexNames)
      throws IOException, TezException {
    printDAGStatus(dagClient, vertexNames, false, false);
  }

  /**
   * Prints the DAG state and progress, then the progress of each named vertex,
   * to standard output; optionally prints vertex and DAG counters as well.
   *
   * <p>Nothing but the (optional) DAG counters is printed when the DAG status
   * carries no progress object. A vertex whose status cannot be retrieved is
   * reported and skipped. A DAG whose total task count is zero or negative is
   * shown as 0% (previously a zero total produced a division by zero and a
   * non-numeric percentage); a vertex with zero tasks is shown as 100%.
   *
   * @param dagClient client used to query the DAG and its vertices
   * @param vertexNames names of the vertices whose progress should be printed
   * @param displayDAGCounters whether to request and print DAG-level counters
   * @param displayVertexCounters whether to request and print per-vertex counters
   * @throws IOException if a status query throws it
   * @throws TezException if a status query throws it
   */
  public static void printDAGStatus(DAGClient dagClient, String[] vertexNames,
      boolean displayDAGCounters, boolean displayVertexCounters)
      throws IOException, TezException {
    // DecimalFormat instances are not synchronized; a per-call instance keeps
    // this static helper safe to call from several threads.
    DecimalFormat percent = new DecimalFormat(PROGRESS_PATTERN);
    Set<StatusGetOpts> counterOpts = EnumSet.of(StatusGetOpts.GET_COUNTERS);

    // Counters are only requested when they are going to be printed.
    DAGStatus dagStatus = dagClient.getDAGStatus(
        displayDAGCounters ? counterOpts : null);
    Progress progress = dagStatus.getDAGProgress();

    if (progress != null) {
      double dagFraction = progressFraction(
          progress.getSucceededTaskCount(), progress.getTotalTaskCount(), 0.0);
      System.out.println("");
      System.out.println("DAG: State: "
          + dagStatus.getState()
          + " Progress: "
          + percent.format(dagFraction));

      for (String vertexName : vertexNames) {
        VertexStatus vStatus = dagClient.getVertexStatus(vertexName,
            displayVertexCounters ? counterOpts : null);
        if (vStatus == null) {
          System.out.println("Could not retrieve status for vertex: "
              + vertexName);
          continue;
        }

        Progress vProgress = vStatus.getProgress();
        if (vProgress != null) {
          // A vertex with no tasks has nothing left to do, so report it as complete.
          double vertexFraction = progressFraction(
              vProgress.getSucceededTaskCount(), vProgress.getTotalTaskCount(), 1.0);
          System.out.println("VertexStatus:"
              + " VertexName: "
              + (vertexName.equals("ivertex1") ? "intermediate-reducer"
                  : vertexName)
              + " Progress: " + percent.format(vertexFraction));
        }

        if (displayVertexCounters) {
          TezCounters counters = vStatus.getVertexCounters();
          if (counters != null) {
            System.out.println("Vertex Counters for " + vertexName + ": "
                + counters);
          }
        }
      }
    }

    if (displayDAGCounters) {
      TezCounters counters = dagStatus.getDAGCounters();
      if (counters != null) {
        System.out.println("DAG Counters: " + counters);
      }
    }
  }

  /**
   * Converts task counts into a progress fraction without ever dividing by zero.
   *
   * @param succeeded number of succeeded tasks
   * @param total total number of tasks
   * @param whenNoTasks value to return when {@code total} is exactly zero
   * @return {@code 0.0} if {@code total} is negative, {@code whenNoTasks} if it
   *     is zero, otherwise {@code succeeded / total} as a double
   */
  private static double progressFraction(int succeeded, int total, double whenNoTasks) {
    if (total < 0) {
      return 0.0;
    }
    if (total == 0) {
      return whenNoTasks;
    }
    return (double) succeeded / total;
  }
}