/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.physical.impl.producer;

import java.util.concurrent.BlockingDeque;
import java.util.concurrent.CountDownLatch;
import java.util.concurrent.LinkedBlockingDeque;
import org.apache.drill.common.expression.SchemaPath;
import org.apache.drill.common.types.TypeProtos.MajorType;
import org.apache.drill.exec.exception.OutOfMemoryException;
import org.apache.drill.exec.expr.TypeHelper;
import org.apache.drill.exec.ops.FragmentContext;
import org.apache.drill.exec.ops.QueryCancelledException;
import org.apache.drill.exec.physical.config.ProducerConsumer;
import org.apache.drill.exec.physical.impl.sort.RecordBatchData;
import org.apache.drill.exec.record.AbstractRecordBatch;
import org.apache.drill.exec.record.BatchSchema;
import org.apache.drill.exec.record.BatchSchema.SelectionVectorMode;
import org.apache.drill.exec.record.MaterializedField;
import org.apache.drill.exec.record.RecordBatch;
import org.apache.drill.exec.record.TransferPair;
import org.apache.drill.exec.record.VectorContainer;
import org.apache.drill.exec.record.VectorWrapper;
import org.apache.drill.exec.vector.ValueVector;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
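
/**
 * Record batch that decouples its upstream operator from its downstream
 * consumer: a dedicated producer thread pulls batches from the incoming
 * {@link RecordBatch} and puts them on a bounded blocking queue, while the
 * fragment's main thread takes them off the queue in {@link #innerNext()}.
 * This lets the upstream (for example, a scan) run up to
 * {@code popConfig.getSize()} batches ahead of the consumer.
 *
 * <p>As a purely illustrative example: with a configured size of 10, the
 * producer can buffer up to ten batches before {@code queue.put(...)} blocks.
 */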
public class ProducerConsumerBatch extends AbstractRecordBatch<ProducerConsumer> {
private static final Logger logger = LoggerFactory.getLogger(ProducerConsumerBatch.class);
private final RecordBatch incoming;
private final Thread producer = new Thread(new Producer(), Thread.currentThread().getName() + " - Producer Thread");
  private boolean running = false; // set once the producer thread has been started
  private final BlockingDeque<RecordBatchDataWrapper> queue; // bounded hand-off buffer between producer and consumer
private int recordCount;
private BatchSchema schema;
  private final CountDownLatch cleanUpLatch = new CountDownLatch(1); // used to wait for the producer to finish cleaning up
protected ProducerConsumerBatch(final ProducerConsumer popConfig, final FragmentContext context, final RecordBatch incoming) throws OutOfMemoryException {
super(popConfig, context);
this.incoming = incoming;
this.queue = new LinkedBlockingDeque<>(popConfig.getSize());
}
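
  /**
   * Returns the next batch to the downstream operator. Starts the producer
   * thread lazily on the first call, then blocks on the queue (time spent
   * blocked is recorded as wait time in the operator stats). A "finished"
   * wrapper signals that the upstream returned NONE.
   */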
@Override
public IterOutcome innerNext() {
if (!running) {
producer.start();
running = true;
}
RecordBatchDataWrapper wrapper;
try {
stats.startWait();
wrapper = queue.take();
logger.debug("Got batch from queue");
} catch (final InterruptedException e) {
throw new QueryCancelledException();
} finally {
stats.stopWait();
}
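    // A "finished" wrapper is the sentinel the producer enqueues once the upstream returns NONE.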
if (wrapper.finished) {
return IterOutcome.NONE;
}
recordCount = wrapper.batch.getRecordCount();
final boolean newSchema = load(wrapper.batch);
return newSchema ? IterOutcome.OK_NEW_SCHEMA : IterOutcome.OK;
}
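
  /**
   * Moves the data of the given batch into this operator's outgoing container.
   * If the schema matches the one seen previously, the value vectors are
   * transferred in place; otherwise the container is rebuilt around the new
   * schema.
   *
   * @return true if the schema changed, so the caller should report
   *         {@link IterOutcome#OK_NEW_SCHEMA}
   */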
private boolean load(final RecordBatchData batch) {
final VectorContainer newContainer = batch.getContainer();
if (schema != null && newContainer.getSchema().equals(schema)) {
container.zeroVectors();
      final BatchSchema containerSchema = container.getSchema();
      for (int i = 0; i < container.getNumberOfColumns(); i++) {
        final MaterializedField field = containerSchema.getColumn(i);
final MajorType type = field.getType();
final ValueVector vOut = container.getValueAccessorById(TypeHelper.getValueVectorClass(type.getMinorType(), type.getMode()),
container.getValueVectorId(SchemaPath.getSimplePath(field.getName())).getFieldIds()).getValueVector();
final ValueVector vIn = newContainer.getValueAccessorById(TypeHelper.getValueVectorClass(type.getMinorType(), type.getMode()),
newContainer.getValueVectorId(SchemaPath.getSimplePath(field.getName())).getFieldIds()).getValueVector();
final TransferPair tp = vIn.makeTransferPair(vOut);
tp.transfer();
}
return false;
} else {
container.clear();
for (final VectorWrapper<?> w : newContainer) {
container.add(w.getValueVector());
}
container.buildSchema(SelectionVectorMode.NONE);
schema = container.getSchema();
return true;
}
}
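
  /**
   * Runnable executed on the producer thread: drains the upstream operator,
   * wrapping each batch and enqueueing it until upstream reports NONE, then
   * enqueues a "finished" sentinel so the consumer knows the stream has ended.
   */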
private class Producer implements Runnable {
RecordBatchDataWrapper wrapper;
@Override
public void run() {
boolean stop = false;
try {
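        // Pull batches from upstream until it is exhausted (NONE) or fails.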
outer:
while (true) {
final IterOutcome upstream = incoming.next();
switch (upstream) {
case NONE:
stop = true;
break outer;
case OK_NEW_SCHEMA:
case OK:
wrapper = RecordBatchDataWrapper.batch(new RecordBatchData(incoming, oContext.getAllocator()));
queue.put(wrapper);
wrapper = null;
break;
default:
              throw new UnsupportedOperationException("Unexpected upstream outcome: " + upstream);
}
}
} catch (final InterruptedException e) {
logger.warn("Producer thread is interrupted.", e);
throw new QueryCancelledException();
} finally {
if (stop) {
try {
clearQueue();
queue.put(RecordBatchDataWrapper.finished());
} catch (final InterruptedException e) {
logger.error("Unable to enqueue the last batch indicator. Something is broken.", e);
            // TODO: handle InterruptedException (e.g., restore the interrupt flag)
}
}
        // Release any batch that was created but never handed off to the queue.
        if (wrapper != null) {
          wrapper.batch.clear();
        }
cleanUpLatch.countDown();
}
}
}
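
  /**
   * Drains any batches still sitting in the queue and releases their buffers
   * so that no memory is leaked when the operator shuts down early.
   */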
private void clearQueue() {
RecordBatchDataWrapper wrapper;
while ((wrapper = queue.poll()) != null) {
if (wrapper.batch != null) {
wrapper.batch.getContainer().clear();
}
}
}
@Override
protected void cancelIncoming() { }
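
  /**
   * Interrupts the producer thread, waits for it to exit and to finish its own
   * cleanup (signalled via {@code cleanUpLatch}), then drains whatever is left
   * in the queue before closing the operator itself.
   */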
@Override
public void close() {
producer.interrupt();
try {
producer.join();
} catch (final InterruptedException e) {
logger.warn("Interrupted while waiting for producer thread");
// TODO InterruptedException
}
try {
cleanUpLatch.await();
} catch (final InterruptedException e) {
logger.warn("Interrupted while waiting for producer to clean up first. I will try to clean up now...", e);
// TODO we should retry to wait for the latch
throw new QueryCancelledException();
} finally {
super.close();
clearQueue();
}
}
@Override
public int getRecordCount() {
return recordCount;
}
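
  /**
   * Queue element that either carries a batch of data or, when
   * {@code finished} is true, acts as the end-of-stream sentinel (in which
   * case {@code batch} is null).
   */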
private static class RecordBatchDataWrapper {
final RecordBatchData batch;
final boolean finished;
RecordBatchDataWrapper(final RecordBatchData batch, final boolean finished) {
this.batch = batch;
this.finished = finished;
}
public static RecordBatchDataWrapper batch(final RecordBatchData batch) {
return new RecordBatchDataWrapper(batch, false);
}
public static RecordBatchDataWrapper finished() {
return new RecordBatchDataWrapper(null, true);
}
}
@Override
public void dump() {
logger.error("ProducerConsumerBatch[container={}, recordCount={}, schema={}]",
container, recordCount, schema);
}
}