blob: 7fd249dd17dd1865501fe0792c7658e7b828e90c [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tajo.engine.planner;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.LocatedFileStatus;
import org.apache.hadoop.fs.Path;
import org.apache.hadoop.fs.RemoteIterator;
import org.apache.tajo.BuiltinStorages;
import org.apache.tajo.LocalTajoTestingUtility;
import org.apache.tajo.TajoConstants;
import org.apache.tajo.TajoTestingCluster;
import org.apache.tajo.algebra.Expr;
import org.apache.tajo.catalog.*;
import org.apache.tajo.catalog.proto.CatalogProtos.FragmentProto;
import org.apache.tajo.catalog.proto.CatalogProtos.FunctionType;
import org.apache.tajo.common.TajoDataTypes.Type;
import org.apache.tajo.datum.DatumFactory;
import org.apache.tajo.engine.function.builtin.SumInt;
import org.apache.tajo.parser.sql.SQLAnalyzer;
import org.apache.tajo.engine.planner.physical.PhysicalPlanUtil;
import org.apache.tajo.exception.TajoException;
import org.apache.tajo.plan.LogicalPlanner;
import org.apache.tajo.plan.expr.*;
import org.apache.tajo.plan.logical.*;
import org.apache.tajo.plan.util.PlannerUtil;
import org.apache.tajo.storage.TablespaceManager;
import org.apache.tajo.storage.Tuple;
import org.apache.tajo.storage.TupleComparator;
import org.apache.tajo.storage.VTuple;
import org.apache.tajo.storage.fragment.FileFragment;
import org.apache.tajo.storage.fragment.FragmentConvertor;
import org.apache.tajo.util.CommonTestingUtil;
import org.apache.tajo.util.KeyValueSet;
import org.junit.AfterClass;
import org.junit.BeforeClass;
import org.junit.Test;
import java.util.ArrayList;
import java.util.List;
import static org.apache.tajo.TajoConstants.DEFAULT_DATABASE_NAME;
import static org.apache.tajo.TajoConstants.DEFAULT_TABLESPACE_NAME;
import static org.junit.Assert.*;
public class TestPlannerUtil {
private static TajoTestingCluster util;
private static CatalogService catalog;
private static SQLAnalyzer analyzer;
private static LogicalPlanner planner;
@BeforeClass
public static void setUp() throws Exception {
util = new TajoTestingCluster();
util.startCatalogCluster();
catalog = util.getCatalogService();
catalog.createTablespace(DEFAULT_TABLESPACE_NAME, "hdfs://localhost:1234/warehouse");
catalog.createDatabase(DEFAULT_DATABASE_NAME, DEFAULT_TABLESPACE_NAME);
Schema schema = SchemaBuilder.builder()
.add("name", Type.TEXT)
.add("empid", CatalogUtil.newSimpleDataType(Type.INT4))
.add("deptname", Type.TEXT).build();
Schema schema2 = SchemaBuilder.builder()
.add("deptname", Type.TEXT)
.add("manager", Type.TEXT).build();
Schema schema3 = SchemaBuilder.builder()
.add("deptname", Type.TEXT)
.add("score", CatalogUtil.newSimpleDataType(Type.INT4)).build();
TableMeta meta = CatalogUtil.newTableMeta(BuiltinStorages.TEXT, util.getConfiguration());
TableDesc people = new TableDesc(
CatalogUtil.buildFQName(TajoConstants.DEFAULT_DATABASE_NAME, "employee"), schema, meta,
CommonTestingUtil.getTestDir().toUri());
catalog.createTable(people);
TableDesc student =
new TableDesc(
CatalogUtil.buildFQName(DEFAULT_DATABASE_NAME, "dept"), schema2, "TEXT",
new KeyValueSet(), CommonTestingUtil.getTestDir().toUri());
catalog.createTable(student);
TableDesc score =
new TableDesc(
CatalogUtil.buildFQName(DEFAULT_DATABASE_NAME, "score"), schema3, "TEXT",
new KeyValueSet(), CommonTestingUtil.getTestDir().toUri());
catalog.createTable(score);
FunctionDesc funcDesc = new FunctionDesc("sumtest", SumInt.class, FunctionType.AGGREGATION,
CatalogUtil.newSimpleDataType(Type.INT4),
CatalogUtil.newSimpleDataTypeArray(Type.INT4));
catalog.createFunction(funcDesc);
analyzer = new SQLAnalyzer();
planner = new LogicalPlanner(catalog, TablespaceManager.getInstance());
}
@AfterClass
public static void tearDown() throws Exception {
util.shutdownCatalogCluster();
}
@Test
public final void testFindTopNode() throws CloneNotSupportedException, TajoException {
// two relations
Expr expr = analyzer.parse(TestLogicalPlanner.QUERIES[1]);
LogicalNode plan = planner.createPlan(LocalTajoTestingUtility.createDummyContext(util.getConfiguration()),
expr).getRootBlock().getRoot();
assertEquals(NodeType.ROOT, plan.getType());
LogicalRootNode root = (LogicalRootNode) plan;
TestLogicalPlanner.testCloneLogicalNode(root);
assertEquals(NodeType.PROJECTION, root.getChild().getType());
ProjectionNode projNode = root.getChild();
assertEquals(NodeType.JOIN, projNode.getChild().getType());
JoinNode joinNode = projNode.getChild();
assertEquals(NodeType.SCAN, joinNode.getLeftChild().getType());
ScanNode leftNode = joinNode.getLeftChild();
assertEquals("default.employee", leftNode.getTableName());
assertEquals(NodeType.SCAN, joinNode.getRightChild().getType());
ScanNode rightNode = joinNode.getRightChild();
assertEquals("default.dept", rightNode.getTableName());
LogicalNode node = PlannerUtil.findTopNode(root, NodeType.ROOT);
assertEquals(NodeType.ROOT, node.getType());
node = PlannerUtil.findTopNode(root, NodeType.PROJECTION);
assertEquals(NodeType.PROJECTION, node.getType());
node = PlannerUtil.findTopNode(root, NodeType.JOIN);
assertEquals(NodeType.JOIN, node.getType());
node = PlannerUtil.findTopNode(root, NodeType.SCAN);
assertEquals(NodeType.SCAN, node.getType());
}
@Test
public final void testIsJoinQual() {
FieldEval f1 = new FieldEval("part.p_partkey", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f2 = new FieldEval("partsupp.ps_partkey",
CatalogUtil.newSimpleDataType(Type.INT4));
BinaryEval [] joinQuals = new BinaryEval[5];
int idx = 0;
joinQuals[idx++] = new BinaryEval(EvalType.EQUAL, f1, f2);
joinQuals[idx++] = new BinaryEval(EvalType.LEQ, f1, f2);
joinQuals[idx++] = new BinaryEval(EvalType.LTH, f1, f2);
joinQuals[idx++] = new BinaryEval(EvalType.GEQ, f1, f2);
joinQuals[idx] = new BinaryEval(EvalType.GTH, f1, f2);
for (int i = 0; i < idx; i++) {
assertTrue(EvalTreeUtil.isJoinQual(joinQuals[idx], true));
}
BinaryEval [] wrongJoinQuals = new BinaryEval[5];
idx = 0;
wrongJoinQuals[idx++] = new BinaryEval(EvalType.OR, f1, f2);
wrongJoinQuals[idx++] = new BinaryEval(EvalType.PLUS, f1, f2);
wrongJoinQuals[idx++] = new BinaryEval(EvalType.LIKE, f1, f2);
ConstEval f3 = new ConstEval(DatumFactory.createInt4(1));
wrongJoinQuals[idx] = new BinaryEval(EvalType.EQUAL, f1, f3);
for (int i = 0; i < idx; i++) {
assertFalse(EvalTreeUtil.isJoinQual(wrongJoinQuals[idx], true));
}
}
@Test
public final void testGetJoinKeyPairs() {
Schema outerSchema = SchemaBuilder.builder()
.add("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4)).build();
Schema innerSchema = SchemaBuilder.builder()
.add("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4)).build();
FieldEval f1 = new FieldEval("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f2 = new FieldEval("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f3 = new FieldEval("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f4 = new FieldEval("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4));
EvalNode equiJoinQual = new BinaryEval(EvalType.EQUAL, f1, f2);
// the case where part is the outer and partsupp is the inner.
List<Column[]> pairs = PlannerUtil.getJoinKeyPairs(equiJoinQual, outerSchema, innerSchema, false);
assertEquals(1, pairs.size());
assertEquals("employee.id1", pairs.get(0)[0].getQualifiedName());
assertEquals("people.fid1", pairs.get(0)[1].getQualifiedName());
// after exchange of outer and inner
pairs = PlannerUtil.getJoinKeyPairs(equiJoinQual, innerSchema, outerSchema, false);
assertEquals("people.fid1", pairs.get(0)[0].getQualifiedName());
assertEquals("employee.id1", pairs.get(0)[1].getQualifiedName());
// composited join key test
EvalNode joinQual2 = new BinaryEval(EvalType.EQUAL, f3, f4);
EvalNode compositedJoinQual = new BinaryEval(EvalType.AND, equiJoinQual, joinQual2);
pairs = PlannerUtil.getJoinKeyPairs(compositedJoinQual, outerSchema, innerSchema, false);
assertEquals(2, pairs.size());
assertEquals("employee.id1", pairs.get(0)[0].getQualifiedName());
assertEquals("people.fid1", pairs.get(0)[1].getQualifiedName());
assertEquals("employee.id2", pairs.get(1)[0].getQualifiedName());
assertEquals("people.fid2", pairs.get(1)[1].getQualifiedName());
// after exchange of outer and inner
pairs = PlannerUtil.getJoinKeyPairs(compositedJoinQual, innerSchema, outerSchema, false);
assertEquals(2, pairs.size());
assertEquals("people.fid1", pairs.get(0)[0].getQualifiedName());
assertEquals("employee.id1", pairs.get(0)[1].getQualifiedName());
assertEquals("people.fid2", pairs.get(1)[0].getQualifiedName());
assertEquals("employee.id2", pairs.get(1)[1].getQualifiedName());
// Theta join (f1 <= f2)
EvalNode thetaJoinQual = new BinaryEval(EvalType.LEQ, f1, f2);
pairs = PlannerUtil.getJoinKeyPairs(thetaJoinQual, outerSchema, innerSchema, true);
assertEquals(1, pairs.size());
assertEquals("employee.id1", pairs.get(0)[0].getQualifiedName());
assertEquals("people.fid1", pairs.get(0)[1].getQualifiedName());
// Composite Theta join (f1 <= f2 AND f3 = f4)
EvalNode compositeThetaJoin = new BinaryEval(EvalType.AND, thetaJoinQual, joinQual2);
pairs = PlannerUtil.getJoinKeyPairs(compositeThetaJoin, outerSchema, innerSchema, true);
assertEquals(2, pairs.size());
assertEquals("employee.id1", pairs.get(0)[0].getQualifiedName());
assertEquals("people.fid1", pairs.get(0)[1].getQualifiedName());
assertEquals("employee.id2", pairs.get(1)[0].getQualifiedName());
assertEquals("people.fid2", pairs.get(1)[1].getQualifiedName());
}
@Test
public final void testGetSortKeysFromJoinQual() {
Schema outerSchema = SchemaBuilder.builder()
.add("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4))
.build();
Schema innerSchema = SchemaBuilder.builder()
.add("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4))
.build();
FieldEval f1 = new FieldEval("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f2 = new FieldEval("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f3 = new FieldEval("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f4 = new FieldEval("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4));
EvalNode joinQual = new BinaryEval(EvalType.EQUAL, f1, f2);
SortSpec[][] sortSpecs = PlannerUtil.getSortKeysFromJoinQual(joinQual, outerSchema, innerSchema);
assertEquals(2, sortSpecs.length);
assertEquals(1, sortSpecs[0].length);
assertEquals(1, sortSpecs[1].length);
assertEquals(outerSchema.getColumn("id1"), sortSpecs[0][0].getSortKey());
assertEquals(innerSchema.getColumn("fid1"), sortSpecs[1][0].getSortKey());
// tests for composited join key
EvalNode joinQual2 = new BinaryEval(EvalType.EQUAL, f3, f4);
EvalNode compositedJoinQual = new BinaryEval(EvalType.AND, joinQual, joinQual2);
sortSpecs = PlannerUtil.getSortKeysFromJoinQual(compositedJoinQual, outerSchema, innerSchema);
assertEquals(2, sortSpecs.length);
assertEquals(2, sortSpecs[0].length);
assertEquals(2, sortSpecs[1].length);
assertEquals(outerSchema.getColumn("id1"), sortSpecs[0][0].getSortKey());
assertEquals(outerSchema.getColumn("id2"), sortSpecs[0][1].getSortKey());
assertEquals(innerSchema.getColumn("fid1"), sortSpecs[1][0].getSortKey());
assertEquals(innerSchema.getColumn("fid2"), sortSpecs[1][1].getSortKey());
}
@Test
public final void testComparatorsFromJoinQual() {
Schema outerSchema = SchemaBuilder.builder()
.add("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4))
.build();
Schema innerSchema = SchemaBuilder.builder()
.add("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4))
.add("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4))
.build();
FieldEval f1 = new FieldEval("employee.id1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f2 = new FieldEval("people.fid1", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f3 = new FieldEval("employee.id2", CatalogUtil.newSimpleDataType(Type.INT4));
FieldEval f4 = new FieldEval("people.fid2", CatalogUtil.newSimpleDataType(Type.INT4));
EvalNode joinQual = new BinaryEval(EvalType.EQUAL, f1, f2);
TupleComparator[] comparators = PhysicalPlanUtil.getComparatorsFromJoinQual(joinQual, outerSchema, innerSchema);
Tuple t1 = new VTuple(2);
t1.put(0, DatumFactory.createInt4(1));
t1.put(1, DatumFactory.createInt4(2));
Tuple t2 = new VTuple(2);
t2.put(0, DatumFactory.createInt4(2));
t2.put(1, DatumFactory.createInt4(3));
TupleComparator outerComparator = comparators[0];
assertTrue(outerComparator.compare(t1, t2) < 0);
assertTrue(outerComparator.compare(t2, t1) > 0);
TupleComparator innerComparator = comparators[1];
assertTrue(innerComparator.compare(t1, t2) < 0);
assertTrue(innerComparator.compare(t2, t1) > 0);
// tests for composited join key
EvalNode joinQual2 = new BinaryEval(EvalType.EQUAL, f3, f4);
EvalNode compositedJoinQual = new BinaryEval(EvalType.AND, joinQual, joinQual2);
comparators = PhysicalPlanUtil.getComparatorsFromJoinQual(compositedJoinQual, outerSchema, innerSchema);
outerComparator = comparators[0];
assertTrue(outerComparator.compare(t1, t2) < 0);
assertTrue(outerComparator.compare(t2, t1) > 0);
innerComparator = comparators[1];
assertTrue(innerComparator.compare(t1, t2) < 0);
assertTrue(innerComparator.compare(t2, t1) > 0);
}
@Test
public void testGetNonZeroLengthDataFiles() throws Exception {
String queryFiles = ClassLoader.getSystemResource("queries").toString() + "/TestSelectQuery";
Path path = new Path(queryFiles);
TableDesc tableDesc = new TableDesc();
tableDesc.setName("Test");
tableDesc.setUri(path.toUri());
FileSystem fs = path.getFileSystem(util.getConfiguration());
List<Path> expectedFiles = new ArrayList<>();
RemoteIterator<LocatedFileStatus> files = fs.listFiles(path, true);
while (files.hasNext()) {
LocatedFileStatus file = files.next();
if (file.isFile() && file.getLen() > 0) {
expectedFiles.add(file.getPath());
}
}
int fileNum = expectedFiles.size() / 5;
int numResultFiles = 0;
for (int i = 0; i <= 5; i++) {
int start = i * fileNum;
FragmentProto[] fragments =
PhysicalPlanUtil.getNonZeroLengthDataFiles(util.getConfiguration(), tableDesc, start, fileNum);
assertNotNull(fragments);
numResultFiles += fragments.length;
int expectedSize = fileNum;
if (i == 5) {
//last
expectedSize = expectedFiles.size() - (fileNum * 5);
}
comparePath(expectedFiles, fragments, start, expectedSize);
}
assertEquals(expectedFiles.size(), numResultFiles);
}
private void comparePath(List<Path> expectedFiles, FragmentProto[] fragments,
int startIndex, int expectedSize) throws Exception {
assertEquals(expectedSize, fragments.length);
int index = 0;
for (int i = startIndex; i < startIndex + expectedSize; i++, index++) {
FileFragment fragment = FragmentConvertor.convert(util.getConfiguration(), fragments[index]);
assertEquals(expectedFiles.get(i), fragment.getPath());
}
}
}