blob: f566f7727a69e154d74e2e1ceb36a9f875211b8c [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.mrunit;
import static org.junit.Assert.*;
import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.io.IntWritable;
import org.apache.hadoop.io.LongWritable;
import org.apache.hadoop.io.Text;
import org.apache.hadoop.io.serializer.JavaSerializationComparator;
import org.apache.hadoop.mapred.JobConf;
import org.apache.hadoop.mapred.Mapper;
import org.apache.hadoop.mapred.Reducer;
import org.apache.hadoop.mapred.lib.IdentityMapper;
import org.apache.hadoop.mapred.lib.IdentityReducer;
import org.apache.hadoop.mapred.lib.LongSumReducer;
import org.apache.hadoop.mrunit.types.Pair;
import org.apache.hadoop.mrunit.types.UncomparableWritable;
import org.junit.Rule;
import org.junit.Test;
@SuppressWarnings("rawtypes")
public class TestPipelineMapReduceDriver {
private static final int FOO_IN_A = 42;
private static final int FOO_IN_B = 10;
private static final int BAR_IN = 12;
private static final int FOO_OUT = 52;
private static final int BAR_OUT = 12;
@Rule
public final ExpectedSuppliedException thrown = ExpectedSuppliedException
.none();
@Test
public void testEmptyPipeline() throws IOException {
thrown.expectMessage(IllegalStateException.class,
"No Mappers or Reducers in pipeline");
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver.withInput(new Text("foo"), new Text("bar")).runTest();
}
@Test
public void testUncomparable() throws IOException {
Text k = new Text("test");
Object v = new UncomparableWritable(2);
PipelineMapReduceDriver.newPipelineMapReduceDriver().withMapReduce(
new IdentityMapper<Text, Object>(),
new IdentityReducer<Text, Object>())
.withInput(k, v).withOutput(k, v).runTest();
}
@Test
public void testNoInput() throws IOException {
thrown.expectMessage(IllegalStateException.class, "No input was provided");
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver.runTest();
}
@Test
public void testSingleIdentity() throws IOException {
// Test that an identity mapper and identity reducer work
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver
.withMapReduce(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>())
.withInput(new Text("foo"), new Text("bar"))
.withOutput(new Text("foo"), new Text("bar")).runTest();
}
@Test
public void testMultipleIdentities() throws IOException {
// Test that a pipeline of identity mapper and reducers work
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver
.withMapReduce(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>())
.withMapReduce(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>())
.withMapReduce(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>())
.withInput(new Text("foo"), new Text("bar"))
.withOutput(new Text("foo"), new Text("bar")).runTest();
}
@Test
public void testSumAtEnd() throws IOException {
final PipelineMapReduceDriver<Text, LongWritable, Text, LongWritable> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new LongSumReducer<Text>())
.withInput(new Text("foo"), new LongWritable(FOO_IN_A))
.withInput(new Text("bar"), new LongWritable(BAR_IN))
.withInput(new Text("foo"), new LongWritable(FOO_IN_B))
.withOutput(new Text("bar"), new LongWritable(BAR_OUT))
.withOutput(new Text("foo"), new LongWritable(FOO_OUT)).runTest();
}
@Test
public void testSumAtEndWithInputAddAll() throws IOException {
final List<Pair<Text, LongWritable>> inputs = new ArrayList<Pair<Text, LongWritable>>();
inputs.add(new Pair<Text, LongWritable>(new Text("foo"), new LongWritable(FOO_IN_A)));
inputs.add(new Pair<Text, LongWritable>(new Text("bar"), new LongWritable(BAR_IN)));
inputs.add(new Pair<Text, LongWritable>(new Text("foo"), new LongWritable(FOO_IN_B)));
final PipelineMapReduceDriver<Text, LongWritable, Text, LongWritable> driver
= PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new LongSumReducer<Text>())
.withAll(inputs)
.withOutput(new Text("bar"), new LongWritable(BAR_OUT))
.withOutput(new Text("foo"), new LongWritable(FOO_OUT)).runTest();
}
@Test
public void testSumInMiddle() throws IOException {
final PipelineMapReduceDriver<Text, LongWritable, Text, LongWritable> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new LongSumReducer<Text>())
.withMapReduce(new IdentityMapper<Text, LongWritable>(),
new IdentityReducer<Text, LongWritable>())
.withInput(new Text("foo"), new LongWritable(FOO_IN_A))
.withInput(new Text("bar"), new LongWritable(BAR_IN))
.withInput(new Text("foo"), new LongWritable(FOO_IN_B))
.withOutput(new Text("bar"), new LongWritable(BAR_OUT))
.withOutput(new Text("foo"), new LongWritable(FOO_OUT)).runTest();
}
@Test
public void testNoMapper() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
thrown.expect(NullPointerException.class);
driver.addMapReduce(null, new IdentityReducer<Text, Text>());
driver.addInput(new Text("a"), new Text("b"));
driver.runTest();
}
@Test
public void testNoReducer() throws IOException {
final List<Pair<Mapper, Reducer>> pipeline = new ArrayList<Pair<Mapper, Reducer>>();
pipeline.add(new Pair<Mapper, Reducer>(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>()));
pipeline.add(null);
pipeline.add(new Pair<Mapper, Reducer>(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>()));
thrown.expectMessage(NullPointerException.class, "entry 1 in list is null");
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver
.newPipelineMapReduceDriver(pipeline);
driver.addInput(new Text("a"), new Text("b"));
driver.runTest();
}
@Test
public void testWithCounter() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.withInput(new Text("hie"), new Text("Hi"))
.withOutput(new Text("hie"), new Text("Hi"))
.withCounter(TestMapDriver.MapperWithCounters.Counters.X, 2)
.withCounter("category", "name", 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.COUNT, 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.SUM, 2)
.withCounter("category", "count", 2).withCounter("category", "sum", 2)
.runTest();
}
@Test
public void testWithCounterAndNoneMissing() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.withInput(new Text("hie"), new Text("Hi"))
.withOutput(new Text("hie"), new Text("Hi"))
.withStrictCounterChecking()
.withCounter(TestMapDriver.MapperWithCounters.Counters.X, 2)
.withCounter("category", "name", 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.COUNT, 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.SUM, 2)
.withCounter("category", "count", 2).withCounter("category", "sum", 2)
.runTest();
}
@Test
public void testWithCounterAndEnumCounterMissing() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
thrown
.expectAssertionErrorMessage("1 Error(s): (Actual counter ("
+ "\"org.apache.hadoop.mrunit.TestMapDriver$MapperWithCounters$Counters\",\"X\")"
+ " was not found in expected counters");
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.withInput(new Text("hie"), new Text("Hi"))
.withOutput(new Text("hie"), new Text("Hi"))
.withStrictCounterChecking()
.withCounter("category", "name", 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.COUNT, 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.SUM, 2)
.withCounter("category", "count", 2).withCounter("category", "sum", 2)
.runTest();
}
@Test
public void testWithCounterAndStringCounterMissing() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
thrown
.expectAssertionErrorMessage("1 Error(s): (Actual counter ("
+ "\"category\",\"name\")"
+ " was not found in expected counters");
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.withInput(new Text("hie"), new Text("Hi"))
.withOutput(new Text("hie"), new Text("Hi"))
.withStrictCounterChecking()
.withCounter(TestMapDriver.MapperWithCounters.Counters.X, 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.COUNT, 2)
.withCounter(TestReduceDriver.ReducerWithCounters.Counters.SUM, 2)
.withCounter("category", "count", 2).withCounter("category", "sum", 2)
.runTest();
}
@Test
public void testWithFailedCounter() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver.newPipelineMapReduceDriver();
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
driver.addMapReduce(
new TestMapDriver.MapperWithCounters<Text, Text, Text, Text>(),
new TestReduceDriver.ReducerWithCounters<Text, Text, Text, Text>());
thrown
.expectAssertionErrorMessage("2 Error(s): ("
+ "Counter org.apache.hadoop.mrunit.TestMapDriver.MapperWithCounters.Counters.X has value 2 instead of expected 20, "
+ "Counter with category category and name name has value 2 instead of expected 20)");
driver.withInput(new Text("hie"), new Text("Hi"))
.withOutput(new Text("hie"), new Text("Hi"))
.withCounter(TestMapDriver.MapperWithCounters.Counters.X, 20)
.withCounter("category", "name", 20).runTest();
}
@Test
public void testJavaSerialization() throws IOException {
final JobConf conf = new JobConf();
conf.setStrings("io.serializations", conf.get("io.serializations"),
"org.apache.hadoop.io.serializer.JavaSerialization");
conf.setOutputKeyComparatorClass(JavaSerializationComparator.class);
conf.setOutputValueGroupingComparator(TestMapReduceDriver.INTEGER_COMPARATOR
.getClass());
final PipelineMapReduceDriver<Integer, IntWritable, Integer, IntWritable> driver = PipelineMapReduceDriver
.newPipelineMapReduceDriver();
driver.addMapReduce(new IdentityMapper<Integer, IntWritable>(),
new IdentityReducer<Integer, IntWritable>());
driver.addMapReduce(new IdentityMapper<Integer, IntWritable>(),
new IdentityReducer<Integer, IntWritable>());
driver.withConfiguration(conf);
driver.withInput(1, new IntWritable(2)).withInput(2, new IntWritable(3));
driver.withOutput(1, new IntWritable(2)).withOutput(2, new IntWritable(3));
driver.runTest();
}
@Test
public void testCopy() throws IOException {
final PipelineMapReduceDriver<Text, Text, Text, Text> driver = PipelineMapReduceDriver
.newPipelineMapReduceDriver();
driver.withMapReduce(new IdentityMapper<Text, Text>(),
new IdentityReducer<Text, Text>());
final Text key = new Text("a");
final Text value = new Text("b");
driver.addInput(key, value);
key.set("c");
value.set("d");
driver.addInput(key, value);
key.set("a");
value.set("b");
driver.addOutput(key, value);
key.set("c");
value.set("d");
driver.addOutput(key, value);
driver.runTest();
}
@Test
public void testMapInputFile() throws IOException {
InputPathStoringMapper<LongWritable,LongWritable> mapper =
new InputPathStoringMapper<LongWritable,LongWritable>();
Path mapInputPath = new Path("myfile");
final PipelineMapReduceDriver<Text, LongWritable, Text, LongWritable> driver = PipelineMapReduceDriver
.newPipelineMapReduceDriver();
driver.addMapReduce(mapper, new IdentityReducer<Text, LongWritable>());
driver.setMapInputPath(mapInputPath);
assertEquals(mapInputPath.getName(), driver.getMapInputPath().getName());
driver.withInput(new Text("a"), new LongWritable(1));
driver.runTest();
assertNotNull(mapper.getMapInputPath());
assertEquals(mapInputPath.getName(), mapper.getMapInputPath().getName());
}
}