// blob: b6e7e720b7dbaacb285bd65afd9607aab50b56b5 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
import com.jayway.jsonpath.JsonPath
import groovy.json.JsonSlurper
import org.apache.hadoop.gateway.shell.Hadoop
import org.apache.hadoop.gateway.shell.hdfs.Hdfs
import org.apache.hadoop.gateway.shell.workflow.Workflow
import static java.util.concurrent.TimeUnit.SECONDS
import org.apache.hadoop.gateway.shell.Credentials
// Gateway endpoint and the local files this sample uploads.
// (The endpoint was previously assigned twice and an unused `tableName`
// variable was defined here; both leftovers have been removed.)
gateway = "https://localhost:8443/gateway/sandbox"
inputFile = "LICENSE"
jarFile = "samples/hadoop-examples.jar"

// Collect the user name and password interactively through the
// "ClearInput" and "HiddenInput" collectors rather than hard-coding them.
credentials = new Credentials()
credentials.add("ClearInput", "Enter username: ", "user")
           .add("HiddenInput", "Enter pas" + "sword: ", "pass")
credentials.collect()

username = credentials.get("user").string()
pass = credentials.get("pass").string()

// Per-user HDFS directory used as the base path for everything this job touches.
jobDir = "/user/" + username + "/test"
// Oozie workflow definition uploaded as workflow.xml: a single <java> action that
// runs the WordCount example class and routes to "end" on success or "fail" on error.
// A triple-single-quoted string is used so Groovy performs no interpolation and the
// ${...} expressions reach Oozie verbatim.
definition = '''\
<workflow-app xmlns="uri:oozie:workflow:0.2" name="wordcount-workflow">
<start to="root-node"/>
<action name="root-node">
<java>
<job-tracker>${jobTracker}</job-tracker>
<name-node>${nameNode}</name-node>
<main-class>org.apache.hadoop.examples.WordCount</main-class>
<arg>${inputDir}</arg>
<arg>${outputDir}</arg>
</java>
<ok to="end"/>
<error to="fail"/>
</action>
<kill name="fail">
<message>Java failed, error message[${wf:errorMessage(wf:lastErrorNode())}]</message>
</kill>
<end name="end"/>
</workflow-app>
'''
// Job properties submitted with the workflow. user.name, nameNode and jobTracker
// are sent with the literal value "default" (presumably resolved on the server
// side -- confirm against the gateway documentation); the directory properties
// are interpolated from jobDir when this string is evaluated.
configuration = """\
<configuration>
<property>
<name>user.name</name>
<value>default</value>
</property>
<property>
<name>nameNode</name>
<value>default</value>
</property>
<property>
<name>jobTracker</name>
<value>default</value>
</property>
<property>
<name>inputDir</name>
<value>${jobDir}/input</value>
</property>
<property>
<name>outputDir</name>
<value>${jobDir}/output</value>
</property>
<property>
<name>oozie.wf.application.path</name>
<value>${jobDir}</value>
</property>
</configuration>
"""
session = Hadoop.login( gateway, username, pass )
try {
  // Reset the job directory so each run starts from the same state.
  println "Delete " + jobDir + ": " + Hdfs.rm( session ).file( jobDir ).recursive().now().statusCode
  println "Mkdir " + jobDir + ": " + Hdfs.mkdir( session ).dir( jobDir ).now().statusCode

  // Queue the three uploads with later(); each closure reports the status code of
  // its own request. They are awaited together before the job is submitted.
  putData = Hdfs.put(session).file( inputFile ).to( jobDir + "/input/FILE" ).later() {
    println "Put " + jobDir + "/input/FILE: " + it.statusCode }
  putJar = Hdfs.put(session).file( jarFile ).to( jobDir + "/lib/hadoop-examples.jar" ).later() {
    println "Put " + jobDir + "/lib/hadoop-examples.jar: " + it.statusCode }
  putWorkflow = Hdfs.put(session).text( definition ).to( jobDir + "/workflow.xml" ).later() {
    println "Put " + jobDir + "/workflow.xml: " + it.statusCode }
  session.waitFor( putWorkflow, putData, putJar )

  jobId = Workflow.submit(session).text( configuration ).now().jobId
  println "Submitted job: " + jobId

  // Poll once per second, at most 60 times, while the job still reports RUNNING.
  println "Polling up to 60s for job completion..."
  status = "RUNNING";
  count = 0;
  while( status == "RUNNING" && count++ < 60 ) {
    sleep( 1000 )
    json = Workflow.status(session).jobId( jobId ).now().string
    status = JsonPath.read( json, "\$.status" )
    print "."; System.out.flush();
  }
  println ""
  println "Job status: " + status

  // On success, list the names of the files in the output directory.
  if( status == "SUCCEEDED" ) {
    text = Hdfs.ls( session ).dir( jobDir + "/output" ).now().string
    json = (new JsonSlurper()).parseText( text )
    println json.FileStatuses.FileStatus.pathSuffix
  }
} finally {
  // Always release the session, even when an HDFS or workflow call above throws.
  println "Session closed: " + session.shutdown( 10, SECONDS )
}