// blob: ed5c1ba7dcd1f9dce34ab68a2805cd4bedfb09e7 [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pig.builtin;
import static org.apache.pig.builtin.mock.Storage.resetData;
import static org.apache.pig.builtin.mock.Storage.tuple;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;
import java.util.Iterator;
import org.apache.pig.PigServer;
import org.apache.pig.builtin.mock.Storage.Data;
import org.apache.pig.data.Tuple;
import org.apache.pig.impl.logicalLayer.schema.Schema;
import org.apache.pig.impl.util.Utils;
import org.apache.pig.test.Util;
import org.junit.After;
import org.junit.Before;
import org.junit.Test;
/**
 * Tests for the {@code PluckTuple} builtin, exercised through Pig Latin
 * scripts registered on a {@link PigServer} running in the local test mode.
 *
 * <p>The schema tests compare {@code dumpSchema} results of the plucked
 * relation against one of the input relations; the output tests load data
 * through {@code mock.Storage} and check the tuples produced.
 */
public class TestPluckTuple {
    /** Server under test; recreated for every test method by {@link #setUp()}. */
    private PigServer pigServer;

    /** Creates a fresh {@link PigServer} in the local test mode. */
    @Before
    public void setUp() throws Exception {
        pigServer = new PigServer(Util.getLocalTestMode());
    }

    /**
     * Shuts down the per-test {@link PigServer} so that whatever it holds is
     * released instead of accumulating across test methods.
     */
    @After
    public void tearDown() throws Exception {
        // JUnit runs @After methods even when setUp() failed, so the server
        // may never have been created.
        if (pigServer != null) {
            pigServer.shutdown();
            pigServer = null;
        }
    }

    /**
     * Joins {@code a} and {@code b}, plucks with the prefix {@code 'a::'} and
     * asserts that the resulting schema equals the schema of {@code a}.
     */
    @Test
    public void testStartsWith() throws Exception {
        String query = "a = load 'a' as (x:int,y:chararray,z:long);" +
                "b = load 'b' as (x:int,y:chararray,z:long);" +
                "c = join a by x, b by x;" +
                "define pluck PluckTuple('a::');" +
                "d = foreach c generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        // NOTE(review): the trailing (false, true) flags presumably mean
        // "strict inner schemas, relaxed aliases" -- confirm against Schema.equals.
        assertTrue(Schema.equals(pigServer.dumpSchema("a"), pigServer.dumpSchema("d"), false, true));
    }

    /**
     * Same script as {@link #testStartsWith()} but with the second constructor
     * argument {@code 'false'}; asserts that the resulting schema equals the
     * schema of {@code b} instead.
     */
    @Test
    public void testNegativeStartsWith() throws Exception {
        String query = "a = load 'a' as (x:int,y:chararray,z:long);" +
                "b = load 'b' as (x:int,y:chararray,z:long);" +
                "c = join a by x, b by x;" +
                "define pluck PluckTuple('a::','false');" +
                "d = foreach c generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        assertTrue(Schema.equals(pigServer.dumpSchema("b"), pigServer.dumpSchema("d"), false, true));
    }

    /**
     * Joins {@code a1} and {@code a2}, plucks with the pattern
     * {@code 'a[2|3]::.*'} and asserts that the resulting schema equals the
     * schema of {@code a2}.
     */
    @Test
    public void testPatternMatches() throws Exception {
        String query = "a1 = load 'a1' as (x:int,y:chararray,z:long);" +
                "a2 = load 'a2' as (x:int,y:chararray,z:long);" +
                "b = join a1 by x, a2 by x;" +
                "define pluck PluckTuple('a[2|3]::.*');" +
                "c = foreach b generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        assertTrue(Schema.equals(pigServer.dumpSchema("a2"), pigServer.dumpSchema("c"), false, true));
    }

    /**
     * Same script as {@link #testPatternMatches()} but with the second
     * constructor argument {@code 'false'}; asserts that the resulting schema
     * equals the schema of {@code a1} instead.
     */
    @Test
    public void testNegativePatternMatches() throws Exception {
        String query = "a1 = load 'a1' as (x:int,y:chararray,z:long);" +
                "a2 = load 'a2' as (x:int,y:chararray,z:long);" +
                "b = join a1 by x, a2 by x;" +
                "define pluck PluckTuple('a[2|3]::.*','false');" +
                "c = foreach b generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        assertTrue(Schema.equals(pigServer.dumpSchema("a1"), pigServer.dumpSchema("c"), false, true));
    }

    /**
     * Loads two mock relations, joins them on {@code x}, plucks with the
     * prefix {@code 'a::'} and asserts that exactly the two {@code a}-side
     * tuples with a join partner come back, in the order they were stored.
     */
    @Test
    public void testOutput() throws Exception {
        Data data = resetData(pigServer);
        Tuple exp1 = tuple(1, "hey", 2L);
        Tuple exp2 = tuple(2, "woah", 3L);
        // x = 3 exists only in 'a' and x = 4 only in 'b', so neither joins.
        data.set("a",
                Utils.getSchemaFromString("x:int,y:chararray,z:long"),
                exp1,
                exp2,
                tuple(3, "c", 4L)
        );
        data.set("b",
                Utils.getSchemaFromString("x:int,y:chararray,z:long"),
                tuple(1, "sasf", 5L),
                tuple(2, "woah", 6L),
                tuple(4, "c", 7L)
        );
        String query = "a = load 'a' using mock.Storage();" +
                "b = load 'b' using mock.Storage();" +
                "c = join a by x, b by x;" +
                "define pluck PluckTuple('a::');" +
                "d = foreach c generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        Iterator<Tuple> it = pigServer.openIterator("d");
        assertTrue(it.hasNext());
        assertEquals(exp1, it.next());
        assertTrue(it.hasNext());
        assertEquals(exp2, it.next());
        assertFalse(it.hasNext());
    }

    /**
     * Applies two differently configured pluck functions ({@code '.a'} and
     * {@code '.b'}) in one {@code foreach} over a relation with fields
     * {@code xa}, {@code yb}, {@code zc}, and asserts that each output tuple
     * holds the first two field values of the corresponding input tuple.
     */
    @Test
    public void testTwoPluckTuples() throws Exception {
        Data data = resetData(pigServer);
        data.set("a",
                Utils.getSchemaFromString("xa:int,yb:chararray,zc:long"),
                tuple(1, "hey", 3L),
                tuple(2, "woah", 4L)
        );
        String query = "a = load 'a' using mock.Storage();" +
                "define pluck1 PluckTuple('.a');" +
                "define pluck2 PluckTuple('.b');" +
                "b = foreach a generate flatten(pluck1(*)), flatten(pluck2(*));";
        pigServer.registerQuery(query);
        Iterator<Tuple> it = pigServer.openIterator("b");
        assertTrue(it.hasNext());
        assertEquals(tuple(1,"hey"), it.next());
        assertTrue(it.hasNext());
        assertEquals(tuple(2,"woah"), it.next());
        assertFalse(it.hasNext());
    }

    /**
     * Counterpart of {@link #testOutput()} with the second constructor
     * argument {@code 'false'}: asserts that exactly the two {@code b}-side
     * tuples with a join partner come back, in the order they were stored.
     */
    @Test
    public void testNegativeOutput() throws Exception {
        Data data = resetData(pigServer);
        Tuple exp1 = tuple(1, "sasf", 5L);
        Tuple exp2 = tuple(2, "woah", 6L);
        // x = 3 exists only in 'a' and x = 4 only in 'b', so neither joins.
        data.set("a",
                Utils.getSchemaFromString("x:int,y:chararray,z:long"),
                tuple(1, "hey", 2L),
                tuple(2, "woah", 3L),
                tuple(3, "c", 4L)
        );
        data.set("b",
                Utils.getSchemaFromString("x:int,y:chararray,z:long"),
                exp1,
                exp2,
                tuple(4, "c", 7L)
        );
        String query = "a = load 'a' using mock.Storage();" +
                "b = load 'b' using mock.Storage();" +
                "c = join a by x, b by x;" +
                "define pluck PluckTuple('a::','false');" +
                "d = foreach c generate flatten(pluck(*));";
        pigServer.registerQuery(query);
        Iterator<Tuple> it = pigServer.openIterator("d");
        assertTrue(it.hasNext());
        assertEquals(exp1, it.next());
        assertTrue(it.hasNext());
        assertEquals(exp2, it.next());
        assertFalse(it.hasNext());
    }
}