blob: d40bd6d9c3abcc95d81e1e503c265d815ae328fb [file] [log] [blame]
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.drill.exec.physical.impl.unorderedreceiver;
import io.netty.buffer.ByteBuf;
import java.util.Iterator;
import org.apache.drill.common.expression.SchemaPath;
import org.apache.drill.exec.exception.OutOfMemoryException;
import org.apache.drill.exec.exception.SchemaChangeException;
import org.apache.drill.exec.ops.ExchangeFragmentContext;
import org.apache.drill.exec.ops.FragmentContext;
import org.apache.drill.exec.ops.MetricDef;
import org.apache.drill.exec.ops.OperatorContext;
import org.apache.drill.exec.ops.OperatorStats;
import org.apache.drill.exec.physical.MinorFragmentEndpoint;
import org.apache.drill.exec.physical.config.UnorderedReceiver;
import org.apache.drill.exec.proto.BitControl.FinishedReceiver;
import org.apache.drill.exec.proto.ExecProtos.FragmentHandle;
import org.apache.drill.exec.proto.GeneralRPCProtos.Ack;
import org.apache.drill.exec.proto.UserBitShared.RecordBatchDef;
import org.apache.drill.exec.record.BatchSchema;
import org.apache.drill.exec.record.CloseableRecordBatch;
import org.apache.drill.exec.record.RawFragmentBatch;
import org.apache.drill.exec.record.RawFragmentBatchProvider;
import org.apache.drill.exec.record.RecordBatchLoader;
import org.apache.drill.exec.record.TypedFieldId;
import org.apache.drill.exec.record.VectorContainer;
import org.apache.drill.exec.record.VectorWrapper;
import org.apache.drill.exec.record.WritableBatch;
import org.apache.drill.exec.record.selection.SelectionVector2;
import org.apache.drill.exec.record.selection.SelectionVector4;
import org.apache.drill.exec.rpc.RpcException;
import org.apache.drill.exec.rpc.RpcOutcomeListener;
import org.apache.drill.exec.testing.ControlsInjector;
import org.apache.drill.exec.testing.ControlsInjectorFactory;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
 * Record batch that pulls {@link RawFragmentBatch}es from a
 * {@link RawFragmentBatchProvider} and loads them into a
 * {@link RecordBatchLoader}; the vector accessors of this class delegate to
 * that loader.
 */
public class UnorderedReceiverBatch implements CloseableRecordBatch {
private static final Logger logger = LoggerFactory.getLogger(UnorderedReceiverBatch.class);
private static final ControlsInjector injector = ControlsInjectorFactory.getInjector(UnorderedReceiverBatch.class);
// Holds the vectors of the most recently loaded batch.
private final RecordBatchLoader batchLoader;
// Source of incoming raw batches.
private final RawFragmentBatchProvider fragProvider;
// Fragment context this receiver was constructed with.
private final ExchangeFragmentContext context;
// Schema taken from batchLoader the last time next() saw a schema change.
private BatchSchema schema;
// Operator statistics obtained from oContext.
private final OperatorStats stats;
// True until next() has completed its first fetch; affects which empty
// batches next() skips.
private boolean first = true;
// Operator configuration (number of senders, providing endpoints).
private final UnorderedReceiver config;
// Operator context created from the fragment context for this operator.
private final OperatorContext oContext;
// Last outcome produced by next(). It is set to IterOutcome.STOP when
// next() fails with an exception.
private IterOutcome lastOutcome;
/**
 * Operator metrics reported by this receiver. Code elsewhere in this class
 * refers to {@code Metric.NUM_SENDERS} and {@code Metric.BYTES_RECEIVED}.
 */
// NOTE(review): the constant declarations are not visible at this point in
// the file; confirm they are present.
public enum Metric implements MetricDef {
// The metric id is the constant's ordinal, so it depends on declaration order.
public int metricId() {
return ordinal();
/**
 * Creates a receiver that reads raw batches from {@code fragProvider}.
 *
 * <p>A new operator context is created from {@code config}; its allocator
 * backs the batch loader and its stats object records the number of senders
 * under {@code Metric.NUM_SENDERS}.
 *
 * @param context fragment context this receiver runs in
 * @param fragProvider provider of incoming raw batches
 * @param config operator configuration
 * @throws OutOfMemoryException declared by this constructor; presumably
 *         raised while creating the operator context (confirm)
 */
public UnorderedReceiverBatch(ExchangeFragmentContext context,
RawFragmentBatchProvider fragProvider, UnorderedReceiver config)
throws OutOfMemoryException {
this.fragProvider = fragProvider;
this.context = context;
// In the normal case, batchLoader does not require an allocator. However,
// in case of splitAndTransfer of a value vector, we may need an allocator
// for the new offset vector. Therefore, we pass the operator context's
// allocator to batchLoader.
oContext = context.newOperatorContext(config);
this.batchLoader = new RecordBatchLoader(oContext.getAllocator());
this.stats = oContext.getStats();
this.stats.setLongStat(Metric.NUM_SENDERS, config.getNumSenders());
this.config = config;
// Register this operator's buffer allocator so that incoming buffers are
// owned by this allocator
// NOTE(review): the statement this comment introduces is not visible here;
// confirm the registration call is present.
/**
 * Returns the fragment context this receiver was constructed with.
 */
public FragmentContext getContext() {
return context;
/**
 * Returns the schema most recently taken from the batch loader by
 * {@code next()}.
 */
public BatchSchema getSchema() {
return schema;
/**
 * Returns the record count reported by the batch loader.
 */
public int getRecordCount() {
return batchLoader.getRecordCount();
/**
 * Asks this receiver to stop.
 *
 * @param sendUpstream selects the branch guarded by the check below
 */
// NOTE(review): only the sendUpstream check is visible here; presumably the
// branch calls informSenders(). Confirm against the full method body.
public void kill(boolean sendUpstream) {
if (sendUpstream) {
/**
 * Returns the batch loader's iterator over its vector wrappers.
 */
public Iterator<VectorWrapper<?>> iterator() {
return batchLoader.iterator();
/**
 * Not supported by this batch.
 *
 * @throws UnsupportedOperationException always
 */
public SelectionVector2 getSelectionVector2() {
throw new UnsupportedOperationException();
/**
 * Not supported by this batch.
 *
 * @throws UnsupportedOperationException always
 */
public SelectionVector4 getSelectionVector4() {
throw new UnsupportedOperationException();
/**
 * Looks up the field id for {@code path} in the batch loader.
 *
 * @param path schema path to resolve
 * @return whatever the batch loader returns for that path
 */
public TypedFieldId getValueVectorId(SchemaPath path) {
return batchLoader.getValueVectorId(path);
/**
 * Fetches a vector wrapper from the batch loader.
 *
 * @param clazz class passed through to the batch loader
 * @param ids field ids passed through to the batch loader
 * @return the wrapper returned by the batch loader
 */
public VectorWrapper<?> getValueAccessorById(Class<?> clazz, int... ids) {
return batchLoader.getValueAccessorById(clazz, ids);
private RawFragmentBatch getNextBatch() throws IOException {
try {
injector.injectInterruptiblePause(context.getExecutionControls(), "waiting-for-data", logger);
return fragProvider.getNext();
} catch(InterruptedException e) {
// Preserve evidence that the interruption occurred so that code higher up
// on the call stack can learn of the
// interruption and respond to it if it wants to.
return null;
/**
 * Fetches the next batch worth delivering and loads it into the batch loader.
 *
 * <p>Batches with a record count of zero are skipped, except that while
 * {@code first} is still true an empty batch that carries at least one field
 * is kept.
 *
 * @return {@code NONE} when no batch is available ({@code STOP} instead if the
 *         executor state says not to continue); {@code OUT_OF_MEMORY} when the
 *         context allocator is over its limit; {@code OK_NEW_SCHEMA} when the
 *         loader reports a schema change; {@code OK} otherwise; {@code STOP}
 *         when a {@code SchemaChangeException} or {@code IOException} is caught
 */
public IterOutcome next() {
try {
RawFragmentBatch batch;
try {
batch = getNextBatch();
// skip over empty batches. we do this since these are basically control messages.
while (batch != null && batch.getHeader().getDef().getRecordCount() == 0
&& (!first || batch.getHeader().getDef().getFieldCount() == 0)) {
batch = getNextBatch();
} finally {
first = false;
// A null batch means nothing more was delivered by getNextBatch().
if (batch == null) {
// NOTE(review): stray second semicolon (an empty statement); harmless but can be removed.
lastOutcome = IterOutcome.NONE;;
if (!context.getExecutorState().shouldContinue()) {
lastOutcome = IterOutcome.STOP;
return lastOutcome;
if (context.getAllocator().isOverLimit()) {
lastOutcome = IterOutcome.OUT_OF_MEMORY;
return lastOutcome;
RecordBatchDef rbd = batch.getHeader().getDef();
// load(...) returns true when the incoming batch changed the schema.
boolean schemaChanged = batchLoader.load(rbd, batch.getBody());
// TODO: Clean: DRILL-2933: That load(...) no longer throws
// SchemaChangeException, so check/clean catch clause below.
stats.addLongStat(Metric.BYTES_RECEIVED, batch.getByteCount());
if(schemaChanged) {
this.schema = batchLoader.getSchema();
stats.batchReceived(0, rbd.getRecordCount(), true);
lastOutcome = IterOutcome.OK_NEW_SCHEMA;
} else {
stats.batchReceived(0, rbd.getRecordCount(), false);
lastOutcome = IterOutcome.OK;
return lastOutcome;
} catch (SchemaChangeException | IOException ex) {
// NOTE(review): the exception is neither logged nor reported before STOP
// is returned in the visible code; confirm this is intended.
lastOutcome = IterOutcome.STOP;
return lastOutcome;
} catch (Exception e) {
// Record the failure for hasFailed() and let the exception propagate.
lastOutcome = IterOutcome.STOP;
throw e;
} finally {
/**
 * Returns the writable batch produced by the batch loader.
 */
public WritableBatch getWritableBatch() {
return batchLoader.getWritableBatch();
/**
 * Closes this record batch.
 */
// NOTE(review): the method body is not visible in this view; confirm what it
// releases.
public void close() {
/**
 * Not supported by this batch.
 *
 * @throws UnsupportedOperationException always, with a message naming the class
 */
// NOTE(review): the argument list of String.format is cut off in this view.
public VectorContainer getOutgoingContainer() {
throw new UnsupportedOperationException(
String.format("You should not call getOutgoingContainer() for class %s",
/**
 * Returns the vector container held by the batch loader.
 */
public VectorContainer getContainer() {
return batchLoader.getContainer();
/**
 * Tells every providing endpoint listed in the operator config that this
 * receiver is finished, sending a {@code FinishedReceiver} message per sender
 * with an {@code OutcomeListener} as the RPC callback.
 */
// NOTE(review): several statements in this method appear cut off in this view
// (the logging call, the builder chains and the receiver of
// informReceiverFinished); confirm against the full source.
private void informSenders() {"Informing senders of request to terminate sending.");
FragmentHandle handlePrototype = FragmentHandle.newBuilder()
// One FinishedReceiver message is built per providing endpoint.
for (MinorFragmentEndpoint providingEndpoint : config.getProvidingEndpoints()) {
FragmentHandle sender = FragmentHandle.newBuilder(handlePrototype)
FinishedReceiver finishedReceiver = FinishedReceiver.newBuilder()
.informReceiverFinished(new OutcomeListener(), finishedReceiver);
// TODO: Code duplication. MergingRecordBatch has the same implementation.
/**
 * RPC callback passed to {@code informReceiverFinished} by
 * {@code informSenders()}.
 */
private class OutcomeListener implements RpcOutcomeListener<Ack> {
// Failure to notify a sender is only logged as a warning.
// NOTE(review): the exception itself is not included in the log call.
public void failed(RpcException ex) {
logger.warn("Failed to inform upstream that receiver is finished");
public void success(Ack value, ByteBuf buffer) {
// Do nothing
// An interrupt is treated as a failure only while the executor state still
// says the fragment should continue; in that case it is logged and the
// executor state is failed with an RpcException wrapping the interrupt.
public void interrupted(InterruptedException e) {
if (context.getExecutorState().shouldContinue()) {
String errMsg = "Received an interrupt RPC outcome while sending ReceiverFinished message";
logger.error(errMsg, e);
context.getExecutorState().fail(new RpcException(errMsg, e));
/**
 * Logs the batch loader and the current schema at error level.
 */
public void dump() {
logger.error("UnorderedReceiverBatch[batchLoader={}, schema={}]", batchLoader, schema);
/**
 * Reports whether the last outcome recorded by {@code next()} was
 * {@code IterOutcome.STOP}.
 *
 * @return {@code true} if {@code lastOutcome} is {@code IterOutcome.STOP}
 */
public boolean hasFailed() {
return lastOutcome == IterOutcome.STOP;