blob: ffc613e30969057285de3f64bece138bd32f6b80 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.beam.sdk.fn.data;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.ConcurrentHashMap;
import java.util.concurrent.ConcurrentMap;
import java.util.concurrent.ExecutionException;
import java.util.function.BiConsumer;
import java.util.function.Consumer;
import javax.annotation.Nullable;
import org.apache.beam.model.fnexecution.v1.BeamFnApi;
import org.apache.beam.model.fnexecution.v1.BeamFnApi.Elements;
import org.apache.beam.model.pipeline.v1.Endpoints;
import org.apache.beam.sdk.fn.stream.OutboundObserverFactory;
import org.apache.beam.vendor.grpc.v1p26p0.com.google.protobuf.ByteString;
import org.apache.beam.vendor.grpc.v1p26p0.io.grpc.Status;
import org.apache.beam.vendor.grpc.v1p26p0.io.grpc.stub.StreamObserver;
import org.apache.beam.vendor.guava.v26_0_jre.com.google.common.annotations.VisibleForTesting;
import org.apache.beam.vendor.guava.v26_0_jre.com.google.common.base.MoreObjects;
import org.apache.beam.vendor.guava.v26_0_jre.com.google.common.collect.ImmutableList;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* A gRPC multiplexer for a specific {@link Endpoints.ApiServiceDescriptor}.
*
* <p>Multiplexes data for inbound consumers based upon their individual {@link
* org.apache.beam.model.fnexecution.v1.BeamFnApi.Target}s.
*
* <p>Multiplexing inbound and outbound streams is as thread safe as the consumers of those streams.
* For inbound streams, this is as thread safe as the inbound observers. For outbound streams, this
* is as thread safe as the underlying stream observer.
*
* <p>TODO: Add support for multiplexing over multiple outbound observers by stickying the output
* location with a specific outbound observer.
*/
public class BeamFnDataGrpcMultiplexer implements AutoCloseable {
private static final Logger LOG = LoggerFactory.getLogger(BeamFnDataGrpcMultiplexer.class);
@Nullable private final Endpoints.ApiServiceDescriptor apiServiceDescriptor;
private final StreamObserver<BeamFnApi.Elements> inboundObserver;
private final StreamObserver<BeamFnApi.Elements> outboundObserver;
private final ConcurrentMap<LogicalEndpoint, CompletableFuture<BiConsumer<ByteString, Boolean>>>
consumers;
public BeamFnDataGrpcMultiplexer(
@Nullable Endpoints.ApiServiceDescriptor apiServiceDescriptor,
OutboundObserverFactory outboundObserverFactory,
OutboundObserverFactory.BasicFactory<Elements, Elements> baseOutboundObserverFactory) {
this.apiServiceDescriptor = apiServiceDescriptor;
this.consumers = new ConcurrentHashMap<>();
this.inboundObserver = new InboundObserver();
this.outboundObserver =
outboundObserverFactory.outboundObserverFor(baseOutboundObserverFactory, inboundObserver);
}
@Override
public String toString() {
return MoreObjects.toStringHelper(this)
.omitNullValues()
.add("apiServiceDescriptor", apiServiceDescriptor)
.add("consumers", consumers)
.toString();
}
public StreamObserver<BeamFnApi.Elements> getInboundObserver() {
return inboundObserver;
}
public StreamObserver<BeamFnApi.Elements> getOutboundObserver() {
return outboundObserver;
}
private CompletableFuture<BiConsumer<ByteString, Boolean>> receiverFuture(
LogicalEndpoint endpoint) {
return consumers.computeIfAbsent(
endpoint, (LogicalEndpoint unused) -> new CompletableFuture<>());
}
public <T> void registerConsumer(
LogicalEndpoint inputLocation, BiConsumer<ByteString, Boolean> bytesReceiver) {
receiverFuture(inputLocation).complete(bytesReceiver);
}
@VisibleForTesting
boolean hasConsumer(LogicalEndpoint outputLocation) {
return consumers.containsKey(outputLocation);
}
@Override
public void close() {
for (CompletableFuture<BiConsumer<ByteString, Boolean>> receiver :
ImmutableList.copyOf(consumers.values())) {
// Cancel any observer waiting for the client to complete. If the receiver has already been
// completed or cancelled, this call will be ignored.
receiver.cancel(true);
}
// Cancel any outbound calls and complete any inbound calls, as this multiplexer is hanging up
outboundObserver.onError(
Status.CANCELLED.withDescription("Multiplexer hanging up").asException());
inboundObserver.onCompleted();
}
/**
* A multiplexing {@link StreamObserver} that selects the inbound {@link Consumer} to pass the
* elements to.
*
* <p>The inbound observer blocks until the {@link Consumer} is bound allowing for the sending
* harness to initiate transmitting data without needing for the receiving harness to signal that
* it is ready to consume that data.
*/
private final class InboundObserver implements StreamObserver<BeamFnApi.Elements> {
@Override
public void onNext(BeamFnApi.Elements value) {
for (BeamFnApi.Elements.Data data : value.getDataList()) {
try {
LogicalEndpoint key =
LogicalEndpoint.data(data.getInstructionId(), data.getTransformId());
CompletableFuture<BiConsumer<ByteString, Boolean>> consumer = receiverFuture(key);
if (!consumer.isDone()) {
LOG.debug(
"Received data for key {} without consumer ready. "
+ "Waiting for consumer to be registered.",
key);
}
boolean isLast = data.getIsLast() || data.getData().isEmpty();
consumer.get().accept(data.getData(), isLast);
if (isLast) {
consumers.remove(key);
}
/*
* TODO: On failure we should fail any bundles that were impacted eagerly
* instead of relying on the Runner harness to do all the failure handling.
*/
} catch (ExecutionException | InterruptedException e) {
LOG.error(
"Client interrupted during handling of data for instruction {} and transform {}",
data.getInstructionId(),
data.getTransformId(),
e);
outboundObserver.onError(e);
} catch (RuntimeException e) {
LOG.error(
"Client failed to handle data for instruction {} and transform {}",
data.getInstructionId(),
data.getTransformId(),
e);
outboundObserver.onError(e);
}
}
for (BeamFnApi.Elements.Timers timer : value.getTimersList()) {
try {
LogicalEndpoint key =
LogicalEndpoint.timer(
timer.getInstructionId(), timer.getTransformId(), timer.getTimerFamilyId());
CompletableFuture<BiConsumer<ByteString, Boolean>> consumer = receiverFuture(key);
if (!consumer.isDone()) {
LOG.debug(
"Received data for key {} without consumer ready. "
+ "Waiting for consumer to be registered.",
key);
}
boolean isLast = timer.getIsLast() || timer.getTimers().isEmpty();
consumer.get().accept(timer.getTimers(), isLast);
if (isLast) {
consumers.remove(key);
}
/*
* TODO: On failure we should fail any bundles that were impacted eagerly
* instead of relying on the Runner harness to do all the failure handling.
*/
} catch (ExecutionException | InterruptedException e) {
LOG.error(
"Client interrupted during handling of timer for instruction {}, transform {}, and timer family {}",
timer.getInstructionId(),
timer.getTransformId(),
timer.getTimerFamilyId(),
e);
outboundObserver.onError(e);
} catch (RuntimeException e) {
LOG.error(
"Client failed to handle timer for instruction {}, transform {}, and timer family {}",
timer.getInstructionId(),
timer.getTransformId(),
timer.getTimerFamilyId(),
e);
outboundObserver.onError(e);
}
}
}
@Override
public void onError(Throwable t) {
LOG.error(
"Failed to handle for {}",
apiServiceDescriptor == null ? "unknown endpoint" : apiServiceDescriptor,
t);
}
@Override
public void onCompleted() {
LOG.warn(
"Hanged up for {}.",
apiServiceDescriptor == null ? "unknown endpoint" : apiServiceDescriptor);
}
}
}