| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.oozie.action.hadoop; |
| |
| import org.apache.hadoop.fs.FileSystem; |
| import org.apache.hadoop.fs.Path; |
| import org.apache.oozie.util.XConfiguration; |
| import org.apache.oozie.util.IOUtils; |
| import org.json.simple.JSONValue; |
| |
| import java.io.File; |
| import java.io.FileInputStream; |
| import java.io.FileOutputStream; |
| import java.io.InputStreamReader; |
| import java.io.OutputStream; |
| import java.io.OutputStreamWriter; |
| import java.io.Writer; |
| import java.nio.charset.StandardCharsets; |
| import java.util.ArrayList; |
| import java.util.LinkedHashSet; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Properties; |
| import java.util.Set; |
| import java.net.URL; |
| |
| public class TestPigMain extends PigTestCase { |
| private SecurityManager SECURITY_MANAGER; |
| |
| @Override |
| protected void setUp() throws Exception { |
| super.setUp(); |
| SECURITY_MANAGER = System.getSecurityManager(); |
| resetPigStats(); |
| } |
| |
| @Override |
| protected void tearDown() throws Exception { |
| System.setSecurityManager(SECURITY_MANAGER); |
| resetPigStats(); |
| super.tearDown(); |
| } |
| |
| @Override |
| protected List<File> getFilesToDelete() { |
| List<File> filesToDelete = super.getFilesToDelete(); |
| filesToDelete.add(new File("pig.properties")); |
| return filesToDelete; |
| } |
| |
| @Override |
| public Void call() throws Exception { |
| FileSystem fs = getFileSystem(); |
| |
| Path script = new Path(getTestCaseDir(), "script.pig"); |
| Writer w = new OutputStreamWriter(new FileOutputStream(script.toString()), StandardCharsets.UTF_8); |
| w.write(pigScript); |
| w.close(); |
| |
| Path inputDir = new Path(getFsTestCaseDir(), "input"); |
| fs.mkdirs(inputDir); |
| Writer writer = new OutputStreamWriter(fs.create(new Path(inputDir, "data.txt")), |
| StandardCharsets.UTF_8); |
| writer.write("hello"); |
| writer.close(); |
| |
| Path outputDir = new Path(getFsTestCaseDir(), "output"); |
| |
| XConfiguration jobConf = new XConfiguration(); |
| XConfiguration.copy(createJobConf(), jobConf); |
| |
| jobConf.set("user.name", getTestUser()); |
| jobConf.set("group.name", getTestGroup()); |
| jobConf.setInt("mapred.map.tasks", 1); |
| jobConf.setInt("mapred.map.max.attempts", 1); |
| jobConf.setInt("mapred.reduce.max.attempts", 1); |
| |
| // option to specify whether stats should be stored or not |
| jobConf.set("oozie.action.external.stats.write", Boolean.toString(writeStats)); |
| |
| jobConf.set("mapreduce.job.tags", "" + System.currentTimeMillis()); |
| setSystemProperty("oozie.job.launch.time", "" + System.currentTimeMillis()); |
| |
| SharelibUtils.addToDistributedCache("pig", fs, getFsTestCaseDir(), jobConf); |
| |
| PigActionExecutor.setPigScript(jobConf, script.toString(), new String[] { "IN=" + inputDir.toUri().getPath(), |
| "OUT=" + outputDir.toUri().getPath() }, new String[] { "-v" }); |
| |
| File actionXml = new File(getTestCaseDir(), "action.xml"); |
| OutputStream os = new FileOutputStream(actionXml); |
| jobConf.writeXml(os); |
| os.close(); |
| |
| File statsDataFile = new File(getTestCaseDir(), "statsdata.properties"); |
| |
| File hadoopIdsFile = new File(getTestCaseDir(), "hadoopIds"); |
| |
| setSystemProperty("oozie.launcher.job.id", "" + System.currentTimeMillis()); |
| setSystemProperty("oozie.action.conf.xml", actionXml.getAbsolutePath()); |
| setSystemProperty("oozie.action.stats.properties", statsDataFile.getAbsolutePath()); |
| setSystemProperty("oozie.action.externalChildIDs", hadoopIdsFile.getAbsolutePath()); |
| |
| |
| URL url = Thread.currentThread().getContextClassLoader().getResource("PigMain.txt"); |
| File classPathDir = new File(url.getPath()).getParentFile(); |
| assertTrue(classPathDir.exists()); |
| Properties props = jobConf.toProperties(); |
| assertEquals(props.getProperty("oozie.pig.args.size"), "1"); |
| File pigProps = new File(classPathDir, "pig.properties"); |
| |
| String user = System.getProperty("user.name"); |
| try { |
| Writer wr = new OutputStreamWriter(new FileOutputStream(pigProps), StandardCharsets.UTF_8); |
| props.store(wr, ""); |
| wr.close(); |
| PigMain.main(null); |
| } |
| finally { |
| pigProps.delete(); |
| System.setProperty("user.name", user); |
| } |
| |
| // Stats should be stored only if option to write stats is set to true |
| if (writeStats) { |
| assertTrue(statsDataFile.exists()); |
| String stats = IOUtils.getReaderAsString(new InputStreamReader( |
| new FileInputStream(statsDataFile), StandardCharsets.UTF_8), -1); |
| // check for some of the expected key values in the stats |
| Map m = (Map) JSONValue.parse(stats); |
| // check for expected 1st level JSON keys |
| assertTrue(m.containsKey("PIG_VERSION")); |
| } else { |
| assertFalse(statsDataFile.exists()); |
| } |
| //File exist only if there is external child jobID. |
| if (hadoopIdsFile.exists()) { |
| String externalChildIds = |
| IOUtils.getReaderAsString(new InputStreamReader(new FileInputStream(hadoopIdsFile), |
| StandardCharsets.UTF_8), -1); |
| assertTrue(externalChildIds.contains("job_")); |
| } |
| return null; |
| } |
| |
| public void testJobIDPattern() { |
| List<String> lines = new ArrayList<String>(); |
| lines.add("HadoopJobId: job_001"); |
| lines.add("Submitted application application_002"); |
| // Non-matching ones |
| lines.add("HadoopJobId is set. job_003"); |
| lines.add("HadoopJobId: abc004"); |
| lines.add("Submitted application = job_005"); |
| lines.add("Submitted application. job_006"); |
| Set<String> jobIds = new LinkedHashSet<String>(); |
| for (String line : lines) { |
| LauncherMain.extractJobIDs(line, PigMain.PIG_JOB_IDS_PATTERNS, jobIds); |
| } |
| Set<String> expected = new LinkedHashSet<String>(); |
| expected.add("job_001"); |
| expected.add("job_002"); |
| assertEquals(expected, jobIds); |
| } |
| |
| } |