blob: 19de81cd4fad0bce525b287f64dc6ace3a897db7 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pig.test;
import static org.apache.pig.builtin.mock.Storage.resetData;
import static org.apache.pig.builtin.mock.Storage.tuple;
import static org.junit.Assert.assertTrue;
import java.io.IOException;
import java.util.List;
import org.apache.pig.PigServer;
import org.apache.pig.builtin.mock.Storage.Data;
import org.apache.pig.data.Tuple;
import org.apache.pig.data.TupleFactory;
import org.junit.Before;
import org.junit.Test;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMultiset;
import com.google.common.collect.ImmutableSortedSet;
import com.google.common.collect.TreeMultiset;
import com.google.common.collect.Multiset;
public class TestRank2 {
private static PigServer pigServer;
private static TupleFactory tf = TupleFactory.getInstance();
private Data data;
@Before
public void setUp() throws Exception {
pigServer = new PigServer(Util.getLocalTestMode());
data = resetData(pigServer);
data.set("test01", tuple("A", 1, "N"), tuple("B", 2, "N"),
tuple("C", 3, "M"), tuple("D", 4, "P"), tuple("E", 4, "Q"),
tuple("E", 4, "Q"), tuple("F", 8, "Q"), tuple("F", 7, "Q"),
tuple("F", 8, "T"), tuple("F", 8, "Q"), tuple("G", 10, "V"));
data.set(
"test02",
tuple("Michael", "Blythe", 1, 1, 1, 1, 4557045.046, 98027),
tuple("Linda", "Mitchell", 2, 1, 1, 1, 5200475.231, 98027),
tuple("Jillian", "Carson", 3, 1, 1, 1, 3857163.633, 98027),
tuple("Garrett", "Vargas", 4, 1, 1, 1, 1764938.986, 98027),
tuple("Tsvi", "Reiter", 5, 1, 1, 2, 2811012.715, 98027),
tuple("Shu", "Ito", 6, 6, 2, 2, 3018725.486, 98055),
tuple("Jose", "Saraiva", 7, 6, 2, 2, 3189356.247, 98055),
tuple("David", "Campbell", 8, 6, 2, 3, 3587378.426, 98055),
tuple("Tete", "Mensa-Annan", 9, 6, 2, 3, 1931620.184, 98055),
tuple("Lynn", "Tsoflias", 10, 6, 2, 3, 1758385.926, 98055),
tuple("Rachel", "Valdez", 11, 6, 2, 4, 2241204.042, 98055),
tuple("Jae", "Pak", 12, 6, 2, 4, 5015682.375, 98055),
tuple("Ranjit", "Varkey Chudukatil", 13, 6, 2, 4,
3827950.238, 98055));
}
@Test
public void testRank01RankByDense() throws IOException {
String query = "A = LOAD 'test01' USING mock.Storage() AS (f1:chararray,f2:int,f3:chararray);"
+ "C = rank A by f3 DENSE;"
+ "store C into 'result' using mock.Storage();";
Util.registerMultiLineQuery(pigServer, query);
Multiset<Tuple> expected = ImmutableMultiset.of(
tf.newTuple(ImmutableList.of((long) 1, "C", 3, "M")),
tf.newTuple(ImmutableList.of((long) 2, "A", 1, "N")),
tf.newTuple(ImmutableList.of((long) 2, "B", 2, "N")),
tf.newTuple(ImmutableList.of((long) 3, "D", 4, "P")),
tf.newTuple(ImmutableList.of((long) 4, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "F", 7, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 5, "F", 8, "T")),
tf.newTuple(ImmutableList.of((long) 6, "G", 10, "V")));
verifyExpected(data.get("result"), expected);
}
@Test
public void testRank02RankByDense() throws IOException {
String query = "A = LOAD 'test01' USING mock.Storage() AS (f1:chararray,f2:int,f3:chararray);"
+ "C = rank A by f2 ASC DENSE;"
+ "store C into 'result' using mock.Storage();";
Util.registerMultiLineQuery(pigServer, query);
Multiset<Tuple> expected = ImmutableMultiset.of(
tf.newTuple(ImmutableList.of((long) 1, "A", 1, "N")),
tf.newTuple(ImmutableList.of((long) 2, "B", 2, "N")),
tf.newTuple(ImmutableList.of((long) 3, "C", 3, "M")),
tf.newTuple(ImmutableList.of((long) 4, "D", 4, "P")),
tf.newTuple(ImmutableList.of((long) 4, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 5, "F", 7, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "T")),
tf.newTuple(ImmutableList.of((long) 7, "G", 10, "V")));
verifyExpected(data.get("result"), expected);
}
@Test
public void testRank03RankByDense() throws IOException {
String query = "A = LOAD 'test01' USING mock.Storage() AS (f1:chararray,f2:int,f3:chararray);"
+ "C = rank A by f1 DESC DENSE;"
+ "store C into 'result' using mock.Storage();";
Util.registerMultiLineQuery(pigServer, query);
Multiset<Tuple> expected = ImmutableMultiset.of(
tf.newTuple(ImmutableList.of((long) 1, "G", 10, "V")),
tf.newTuple(ImmutableList.of((long) 2, "F", 8, "T")),
tf.newTuple(ImmutableList.of((long) 2, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 2, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 2, "F", 7, "Q")),
tf.newTuple(ImmutableList.of((long) 3, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 3, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 4, "D", 4, "P")),
tf.newTuple(ImmutableList.of((long) 5, "C", 3, "M")),
tf.newTuple(ImmutableList.of((long) 6, "B", 2, "N")),
tf.newTuple(ImmutableList.of((long) 7, "A", 1, "N")));
verifyExpected(data.get("result"), expected);
}
@Test
public void testRank04RankByDense() throws IOException {
String query = "A = LOAD 'test01' USING mock.Storage() AS (f1:chararray,f2:int,f3:chararray);"
+ "C = rank A by f1, f2 DESC DENSE;"
+ "store C into 'result' using mock.Storage();";
Util.registerMultiLineQuery(pigServer, query);
Multiset<Tuple> expected = ImmutableMultiset.of(
tf.newTuple(ImmutableList.of((long) 1, "A", 1, "N")),
tf.newTuple(ImmutableList.of((long) 2, "B", 2, "N")),
tf.newTuple(ImmutableList.of((long) 3, "C", 3, "M")),
tf.newTuple(ImmutableList.of((long) 4, "D", 4, "P")),
tf.newTuple(ImmutableList.of((long) 5, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 5, "E", 4, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "Q")),
tf.newTuple(ImmutableList.of((long) 6, "F", 8, "T")),
tf.newTuple(ImmutableList.of((long) 7, "F", 7, "Q")),
tf.newTuple(ImmutableList.of((long) 8, "G", 10, "V")));
verifyExpected(data.get("result"), expected);
}
public void verifyExpected(List<Tuple> out, Multiset<Tuple> expected) {
Multiset<Tuple> resultMultiset = TreeMultiset.create();
for (Tuple tup : out) {
resultMultiset.add(tup);
}
StringBuilder error = new StringBuilder("Result does not match.\nActual result:\n");
for (Tuple tup : resultMultiset.elementSet() ) {
error.append(tup).append(" x ").append(resultMultiset.count(tup)).append("\n");
}
error.append("Expceted result:\n");
for (Tuple tup : ImmutableSortedSet.copyOf(expected) ) {
error.append(tup).append(" x ").append(expected.count(tup)).append("\n");
}
//This one line test should be sufficient but adding the above
//for-loop for better error messages
assertTrue(error.toString(), resultMultiset.equals(expected));
}
}