/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.tajo.engine.planner.physical;

import com.google.common.base.Preconditions;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.tajo.catalog.CatalogUtil;
import org.apache.tajo.catalog.Column;
import org.apache.tajo.catalog.TableMeta;
import org.apache.tajo.catalog.statistics.TableStats;
import org.apache.tajo.conf.TajoConf.ConfVars;
import org.apache.tajo.plan.logical.ShuffleFileWriteNode;
import org.apache.tajo.storage.HashShuffleAppender;
import org.apache.tajo.storage.HashShuffleAppenderManager;
import org.apache.tajo.storage.Tuple;
import org.apache.tajo.worker.TaskAttemptContext;

import java.io.IOException;
import java.util.HashMap;
import java.util.Map;

/**
 * <code>HashShuffleFileWriteExec</code> is a physical executor to store intermediate data into a number of
 * file outputs associated with shuffle keys. The file outputs are stored on local disks.
 */
public final class HashShuffleFileWriteExec extends UnaryPhysicalExec {
  private static Log LOG = LogFactory.getLog(HashShuffleFileWriteExec.class);

  private ShuffleFileWriteNode plan;
  private final TableMeta meta;
  private Partitioner partitioner;
  private Map<Integer, HashShuffleAppender> appenderMap = new HashMap<Integer, HashShuffleAppender>();
  private final int numShuffleOutputs;
  private final int[] shuffleKeyIds;
  private HashShuffleAppenderManager hashShuffleAppenderManager;
  private int numHashShuffleBufferTuples;
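
  /**
   * Creates a hash shuffle writer for the given plan. The shuffle key columns declared by the
   * plan are resolved against the input schema, and a {@link HashPartitioner} built over those
   * columns decides which output partition each tuple belongs to.
   */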
  public HashShuffleFileWriteExec(TaskAttemptContext context,
                                  final ShuffleFileWriteNode plan, final PhysicalExec child) throws IOException {
    super(context, plan.getInSchema(), plan.getOutSchema(), child);
    Preconditions.checkArgument(plan.hasShuffleKeys());
    this.plan = plan;
    if (plan.hasOptions()) {
      this.meta = CatalogUtil.newTableMeta(plan.getStorageType(), plan.getOptions());
    } else {
      this.meta = CatalogUtil.newTableMeta(plan.getStorageType());
    }

    // Resolve each shuffle key to its column id in the input schema.
    this.numShuffleOutputs = this.plan.getNumOutputs();
    int i = 0;
    this.shuffleKeyIds = new int[this.plan.getShuffleKeys().length];
    for (Column key : this.plan.getShuffleKeys()) {
      shuffleKeyIds[i] = inSchema.getColumnId(key.getQualifiedName());
      i++;
    }

    this.partitioner = new HashPartitioner(shuffleKeyIds, numShuffleOutputs);
    this.hashShuffleAppenderManager = context.getHashShuffleAppenderManager();
    this.numHashShuffleBufferTuples = context.getConf().getIntVar(ConfVars.SHUFFLE_HASH_APPENDER_BUFFER_SIZE);
  }

  @Override
  public void init() throws IOException {
    super.init();
  }
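
  /**
   * Returns the appender for the given partition id, creating and caching it on first use.
   * Appenders are obtained from the {@link HashShuffleAppenderManager}, keyed by the
   * execution block and partition id of this task.
   */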
  private HashShuffleAppender getAppender(int partId) throws IOException {
    HashShuffleAppender appender = appenderMap.get(partId);
    if (appender == null) {
      appender = hashShuffleAppenderManager.getAppender(context.getConf(),
          context.getTaskId().getTaskId().getExecutionBlockId(), partId, meta, outSchema);
      appenderMap.put(partId, appender);
    }
    return appender;
  }
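
  // In-memory buffers, one per partition; tuples are flushed to the appenders in batches.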
  Map<Integer, TupleList> partitionTuples = new HashMap<Integer, TupleList>();
  long writtenBytes = 0L;
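
  /**
   * Drains the child operator: each tuple is hashed into a partition buffer, and the buffers are
   * flushed to the per-partition appenders whenever the number of buffered tuples reaches the
   * configured threshold. When the input is exhausted, the remaining buffers are flushed and the
   * written bytes and row count are reported as the result stats. Always returns null.
   */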
  @Override
  public Tuple next() throws IOException {
    try {
      Tuple tuple;
      int partId;
      int tupleCount = 0;
      long numRows = 0;
      while (!context.isStopped() && (tuple = child.next()) != null) {
        tupleCount++;
        numRows++;

        partId = partitioner.getPartition(tuple);
        TupleList partitionTupleList = partitionTuples.get(partId);
        if (partitionTupleList == null) {
          partitionTupleList = new TupleList(1000);
          partitionTuples.put(partId, partitionTupleList);
        }
        partitionTupleList.add(tuple);
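
        // Once the buffer threshold is reached, append each partition's tuples and reset the counter.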
        if (tupleCount >= numHashShuffleBufferTuples) {
          for (Map.Entry<Integer, TupleList> entry : partitionTuples.entrySet()) {
            int appendPartId = entry.getKey();
            HashShuffleAppender appender = getAppender(appendPartId);
            int appendedSize = appender.addTuples(context.getTaskId(), entry.getValue());
            writtenBytes += appendedSize;
            entry.getValue().clear();
          }
          tupleCount = 0;
        }
      }

      // Flush the remaining buffered tuples.
      for (Map.Entry<Integer, TupleList> entry : partitionTuples.entrySet()) {
        int appendPartId = entry.getKey();
        HashShuffleAppender appender = getAppender(appendPartId);
        int appendedSize = appender.addTuples(context.getTaskId(), entry.getValue());
        writtenBytes += appendedSize;
        entry.getValue().clear();
      }

      TableStats aggregated = (TableStats) child.getInputStats().clone();
      aggregated.setNumBytes(writtenBytes);
      aggregated.setNumRows(numRows);
      context.setResultStats(aggregated);

      partitionTuples.clear();
      return null;
    } catch (Exception e) {
      LOG.error(e.getMessage(), e);
      throw new IOException(e);
    }
  }
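
  /**
   * This executor writes its output to the shuffle appenders and produces no scannable result,
   * so rescan is a no-op.
   */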
  @Override
  public void rescan() throws IOException {
    // nothing to do
  }

  @Override
  public void close() throws IOException {
    super.close();

    if (appenderMap != null) {
      appenderMap.clear();
      appenderMap = null;
    }
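
    // Drop any tuples still buffered in memory (e.g. when the task was stopped early).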
    for (TupleList eachList : partitionTuples.values()) {
      eachList.clear();
    }
    partitionTuples.clear();
    partitionTuples = null;

    partitioner = null;
    plan = null;

    progress = 1.0f;
  }
}