blob: 7c799767c29dea53e612f2f788693c362879ed9e [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
* http://www.apache.org/licenses/LICENSE-2.0
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pig.test;
import static org.junit.Assert.assertTrue;
import java.io.File;
import java.io.FileOutputStream;
import java.io.IOException;
import java.io.PrintStream;
import java.util.Iterator;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.pig.EvalFunc;
import org.apache.pig.ExecType;
import org.apache.pig.PigServer;
import org.apache.pig.backend.hadoop.datastorage.ConfigurationUtil;
import org.apache.pig.backend.hadoop.executionengine.mapReduceLayer.PigMapReduce;
import org.apache.pig.builtin.PigStorage;
import org.apache.pig.data.BagFactory;
import org.apache.pig.data.Tuple;
import org.apache.pig.data.TupleFactory;
import org.junit.AfterClass;
import org.junit.Before;
import org.junit.Test;
public class TestFinish {
private PigServer pigServer;
TupleFactory mTf = TupleFactory.getInstance();
BagFactory mBf = BagFactory.getInstance();
File f1;
private static MiniGenericCluster cluster = MiniGenericCluster.buildCluster();
static public class MyEvalFunction extends EvalFunc<Tuple> {
String execType;
String expectedFileName;
/**
*
*/
public MyEvalFunction(String execType, String expectedFileName) {
this.execType = execType;
this.expectedFileName = expectedFileName;
}
@Override
public Tuple exec(Tuple input) throws IOException {
return input;
}
@Override
public void finish() {
try {
FileSystem fs = FileSystem.get(PigMapReduce.sJobConfInternal.get());
fs.create(new Path(expectedFileName));
} catch (IOException e) {
throw new RuntimeException("Unable to create file:" + expectedFileName);
}
}
}
@Before
public void setUp() throws Exception {
// Reset state since some tests are in mapred and some in local mode
Util.resetStateForExecModeSwitch();
}
@AfterClass
public static void oneTimeTearDown() throws Exception {
cluster.shutDown();
}
private String setUp(ExecType execType) throws Exception {
String inputFileName;
if (execType == ExecType.LOCAL) {
pigServer = new PigServer(ExecType.LOCAL);
f1 = File.createTempFile("test", "txt");
f1.deleteOnExit();
inputFileName = f1.getAbsolutePath();
PrintStream ps = new PrintStream(new FileOutputStream(f1));
for (int i = 0; i < 3; i++) {
ps.println('a' + i + ":1");
}
ps.close();
} else {
pigServer = new PigServer(cluster.getExecType(), cluster.getProperties());
f1 = File.createTempFile("test", "txt");
f1.delete();
inputFileName = Util.removeColon(f1.getAbsolutePath());
String input[] = new String[3];
for (int i = 0; i < 3; i++) {
input[i] = ('a' + i + ":1");
}
Util.createInputFile(cluster, inputFileName, input);
}
return inputFileName;
}
private void checkAndCleanup(ExecType execType, String expectedFileName,
String inputFileName) throws IOException {
if (execType == cluster.getExecType()) {
FileSystem fs = FileSystem.get(ConfigurationUtil.toConfiguration(
cluster.getProperties()));
assertTrue(fs.exists(new Path(expectedFileName)));
Util.deleteFile(cluster, inputFileName);
Util.deleteFile(cluster, expectedFileName);
} else if (execType == ExecType.LOCAL) {
File f = new File(expectedFileName);
assertTrue(f.exists());
f.delete();
} else {
throw new IllegalArgumentException("invalid excetype " + execType.
toString());
}
}
@Test
public void testFinishInMapMR() throws Exception {
String inputFileName = setUp(cluster.getExecType());
// this file will be created on the cluster if finish() is called
String expectedFileName = "testFinishInMapMR-finish.txt";
pigServer.registerQuery("define MYUDF " + MyEvalFunction.class.getName() + "('MAPREDUCE','"
+ expectedFileName + "');");
pigServer.registerQuery("a = load '" + Util.encodeEscape(inputFileName) + "' using "
+ PigStorage.class.getName() + "(':');");
pigServer.registerQuery("b = foreach a generate MYUDF" + "(*);");
Iterator<Tuple> iter = pigServer.openIterator("b");
while (iter.hasNext()) {
iter.next();
}
checkAndCleanup(cluster.getExecType(), expectedFileName, inputFileName);
}
@Test
public void testFinishInReduceMR() throws Exception {
String inputFileName = setUp(cluster.getExecType());
// this file will be created on the cluster if finish() is called
String expectedFileName = "testFinishInReduceMR-finish.txt";
pigServer.registerQuery("define MYUDF " + MyEvalFunction.class.getName() + "('MAPREDUCE','"
+ expectedFileName + "');");
pigServer.registerQuery("a = load '" + Util.encodeEscape(inputFileName) + "' using "
+ PigStorage.class.getName() + "(':');");
pigServer.registerQuery("a1 = group a by $1;");
pigServer.registerQuery("b = foreach a1 generate MYUDF" + "(*);");
Iterator<Tuple> iter = pigServer.openIterator("b");
while (iter.hasNext()) {
iter.next();
}
checkAndCleanup(cluster.getExecType(), expectedFileName, inputFileName);
}
@Test
public void testFinishInMapLoc() throws Exception {
String inputFileName = setUp(ExecType.LOCAL);
// this file will be created on the cluster if finish() is called
String expectedFileName = "testFinishInMapLoc-finish.txt";
pigServer.registerQuery("define MYUDF " + MyEvalFunction.class.getName() + "('LOCAL','"
+ expectedFileName + "');");
pigServer.registerQuery("a = load '" + Util.encodeEscape(inputFileName) + "' using "
+ PigStorage.class.getName() + "(':');");
pigServer.registerQuery("b = foreach a generate MYUDF" + "(*);");
pigServer.openIterator("b");
checkAndCleanup(ExecType.LOCAL, expectedFileName, inputFileName);
}
@Test
public void testFinishInReduceLoc() throws Exception {
String inputFileName = setUp(ExecType.LOCAL);
// this file will be created on the cluster if finish() is called
String expectedFileName = "testFinishInReduceLoc-finish.txt";
pigServer.registerQuery("define MYUDF " + MyEvalFunction.class.getName() + "('LOCAL','"
+ expectedFileName + "');");
pigServer.registerQuery("a = load '" + Util.encodeEscape(inputFileName) + "' using "
+ PigStorage.class.getName() + "(':');");
pigServer.registerQuery("a1 = group a by $1;");
pigServer.registerQuery("b = foreach a1 generate MYUDF" + "(*);");
pigServer.openIterator("b");
checkAndCleanup(ExecType.LOCAL, expectedFileName, inputFileName);
}
}