| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| package org.apache.nemo.common.test; |
| |
| import com.fasterxml.jackson.databind.node.ObjectNode; |
| import org.apache.beam.sdk.values.KV; |
| import org.apache.nemo.common.KeyExtractor; |
| import org.apache.nemo.common.coder.DecoderFactory; |
| import org.apache.nemo.common.coder.EncoderFactory; |
| import org.apache.nemo.common.dag.DAGBuilder; |
| import org.apache.nemo.common.ir.IRDAG; |
| import org.apache.nemo.common.ir.OutputCollector; |
| import org.apache.nemo.common.ir.Readable; |
| import org.apache.nemo.common.ir.edge.IREdge; |
| import org.apache.nemo.common.ir.edge.executionproperty.*; |
| import org.apache.nemo.common.ir.vertex.IRVertex; |
| import org.apache.nemo.common.ir.vertex.OperatorVertex; |
| import org.apache.nemo.common.ir.vertex.SourceVertex; |
| import org.apache.nemo.common.ir.vertex.transform.NoWatermarkEmitTransform; |
| import org.apache.nemo.common.ir.vertex.transform.Transform; |
| |
| import java.io.IOException; |
| import java.util.ArrayList; |
| import java.util.List; |
| |
| /** |
| * Empty components to mock transform and source, for tests and examples. |
| */ |
| public final class EmptyComponents { |
| public static final Transform EMPTY_TRANSFORM = new EmptyTransform(""); |
| |
| /** |
| * private constructor. |
| */ |
| private EmptyComponents() { |
| } |
| |
| public static IREdge newDummyShuffleEdge(final IRVertex src, final IRVertex dst) { |
| final IREdge edge = new IREdge(CommunicationPatternProperty.Value.SHUFFLE, src, dst); |
| edge.setProperty(KeyExtractorProperty.of(new DummyBeamKeyExtractor())); |
| edge.setProperty(KeyEncoderProperty.of(new EncoderFactory.DummyEncoderFactory())); |
| edge.setProperty(KeyDecoderProperty.of(new DecoderFactory.DummyDecoderFactory())); |
| edge.setProperty(EncoderProperty.of(new EncoderFactory.DummyEncoderFactory())); |
| edge.setProperty(DecoderProperty.of(new DecoderFactory.DummyDecoderFactory())); |
| edge.setProperty(KeyEncoderProperty.of(new EncoderFactory.DummyEncoderFactory())); |
| edge.setProperty(KeyDecoderProperty.of(new DecoderFactory.DummyDecoderFactory())); |
| return edge; |
| } |
| |
| /** |
| * Builds dummy IR DAG for testing. |
| * |
| * @return the dummy IR DAG. |
| */ |
| public static IRDAG buildEmptyDAG() { |
| DAGBuilder<IRVertex, IREdge> dagBuilder = new DAGBuilder<>(); |
| final IRVertex s = new EmptyComponents.EmptySourceVertex<>("s"); |
| final IRVertex t1 = new OperatorVertex(new EmptyComponents.EmptyTransform("t1")); |
| final IRVertex t2 = new OperatorVertex(new EmptyComponents.EmptyTransform("t2")); |
| final IRVertex t3 = new OperatorVertex(new EmptyComponents.EmptyTransform("t3")); |
| final IRVertex t4 = new OperatorVertex(new EmptyComponents.EmptyTransform("t4")); |
| final IRVertex t5 = new OperatorVertex(new EmptyComponents.EmptyTransform("t5")); |
| dagBuilder.addVertex(s); |
| dagBuilder.addVertex(t1); |
| dagBuilder.addVertex(t2); |
| dagBuilder.addVertex(t3); |
| dagBuilder.addVertex(t4); |
| dagBuilder.addVertex(t5); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, s, t1)); |
| dagBuilder.connectVertices(newDummyShuffleEdge(t1, t2)); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, t2, t3)); |
| dagBuilder.connectVertices(newDummyShuffleEdge(t3, t4)); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, t2, t5)); |
| return new IRDAG(dagBuilder.build()); |
| } |
| |
| /** |
| * Builds dummy IR DAG to test skew handling. |
| * For DataSkewPolicy, shuffle edges needs extra setting for EncoderProperty, DecoderProperty |
| * and KeyExtractorProperty by default. |
| * |
| * @return the dummy IR DAG. |
| */ |
| public static IRDAG buildEmptyDAGForSkew() { |
| DAGBuilder<IRVertex, IREdge> dagBuilder = new DAGBuilder<>(); |
| final IRVertex s = new EmptyComponents.EmptySourceVertex<>("s"); |
| final IRVertex t1 = new OperatorVertex(new EmptyComponents.EmptyTransform("t1")); |
| final IRVertex t2 = new OperatorVertex(new EmptyComponents.EmptyTransform("t2")); |
| final IRVertex t3 = new OperatorVertex(new EmptyComponents.EmptyTransform("t3")); |
| final IRVertex t4 = new OperatorVertex(new EmptyComponents.EmptyTransform("t4")); |
| final IRVertex t5 = new OperatorVertex(new EmptyComponents.EmptyTransform("t5")); |
| |
| final IREdge shuffleEdgeBetweenT1AndT2 = newDummyShuffleEdge(t1, t2); |
| final IREdge shuffleEdgeBetweenT3AndT4 = newDummyShuffleEdge(t3, t4); |
| |
| dagBuilder.addVertex(s); |
| dagBuilder.addVertex(t1); |
| dagBuilder.addVertex(t2); |
| dagBuilder.addVertex(t3); |
| dagBuilder.addVertex(t4); |
| dagBuilder.addVertex(t5); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, s, t1)); |
| dagBuilder.connectVertices(shuffleEdgeBetweenT1AndT2); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, t2, t3)); |
| dagBuilder.connectVertices(shuffleEdgeBetweenT3AndT4); |
| dagBuilder.connectVertices(new IREdge(CommunicationPatternProperty.Value.ONE_TO_ONE, t2, t5)); |
| return new IRDAG(dagBuilder.build()); |
| } |
| |
| /** |
| * Dummy beam key extractor. |
| **/ |
| static class DummyBeamKeyExtractor implements KeyExtractor { |
| @Override |
| public Object extractKey(final Object element) { |
| if (element instanceof KV) { |
| // Handle null keys, since Beam allows KV with null keys. |
| final Object key = ((KV) element).getKey(); |
| return key == null ? 0 : key; |
| } else { |
| return element; |
| } |
| } |
| } |
| |
| /** |
| * An empty transform. |
| * |
| * @param <I> input type. |
| * @param <O> output type. |
| */ |
| public static class EmptyTransform<I, O> extends NoWatermarkEmitTransform<I, O> { |
| private final String name; |
| |
| /** |
| * Default constructor. |
| * |
| * @param name name of the empty transform. |
| */ |
| public EmptyTransform(final String name) { |
| this.name = name; |
| } |
| |
| @Override |
| public final String toString() { |
| final StringBuilder sb = new StringBuilder(); |
| sb.append(super.toString()); |
| sb.append(", name: "); |
| sb.append(name); |
| return sb.toString(); |
| } |
| |
| @Override |
| public void prepare(final Context context, final OutputCollector<O> outputCollector) { |
| // Do nothing in an EmptyTransform. |
| } |
| |
| @Override |
| public void onData(final I element) { |
| // Do nothing in an EmptyTransform. |
| } |
| |
| @Override |
| public void close() { |
| // Do nothing in an EmptyTransform. |
| } |
| } |
| |
| /** |
| * An empty Source Vertex. |
| * |
| * @param <T> type of the data. |
| */ |
| public static final class EmptySourceVertex<T> extends SourceVertex<T> { |
| private String name; |
| private int minNumReadables; |
| |
| /** |
| * Constructor. |
| * |
| * @param name name for the vertex. |
| */ |
| public EmptySourceVertex(final String name) { |
| new EmptySourceVertex(name, 1); |
| } |
| |
| /** |
| * Constructor. |
| * |
| * @param name name for the vertex. |
| * @param minNumReadables for the vertex. |
| */ |
| public EmptySourceVertex(final String name, final int minNumReadables) { |
| this.name = name; |
| this.minNumReadables = minNumReadables; |
| } |
| |
| /** |
| * Copy Constructor for EmptySourceVertex. |
| * |
| * @param that the source object for copying |
| */ |
| private EmptySourceVertex(final EmptySourceVertex that) { |
| this.name = that.name; |
| } |
| |
| @Override |
| public String toString() { |
| final StringBuilder sb = new StringBuilder(); |
| sb.append(super.toString()); |
| sb.append(", name: "); |
| sb.append(name); |
| return sb.toString(); |
| } |
| |
| @Override |
| public ObjectNode getPropertiesAsJsonNode() { |
| final ObjectNode node = getIRVertexPropertiesAsJsonNode(); |
| node.put("source", "EmptySourceVertex(" + name + " / minNumReadables: " + minNumReadables + ")"); |
| return node; |
| } |
| |
| @Override |
| public boolean isBounded() { |
| return true; |
| } |
| |
| @Override |
| public List<Readable<T>> getReadables(final int desirednumOfSplits) { |
| final List<Readable<T>> list = new ArrayList<>(Math.max(minNumReadables, desirednumOfSplits)); |
| for (int i = 0; i < Math.max(minNumReadables, desirednumOfSplits); i++) { |
| list.add(new EmptyReadable<>()); |
| } |
| return list; |
| } |
| |
| @Override |
| public long getEstimatedSizeBytes() { |
| return 0L; |
| } |
| |
| @Override |
| public void clearInternalStates() { |
| } |
| |
| @Override |
| public EmptySourceVertex<T> getClone() { |
| return new EmptySourceVertex<>(this); |
| } |
| } |
| |
| /** |
| * An empty reader. |
| * |
| * @param <T> type of the data. |
| */ |
| static final class EmptyReadable<T> implements Readable<T> { |
| @Override |
| public void prepare() { |
| |
| } |
| |
| @Override |
| public T readCurrent() { |
| return null; |
| } |
| |
| @Override |
| public long readWatermark() { |
| return 0; |
| } |
| |
| @Override |
| public boolean isFinished() { |
| return true; |
| } |
| |
| @Override |
| public List<String> getLocations() { |
| throw new UnsupportedOperationException(); |
| } |
| |
| @Override |
| public void close() throws IOException { |
| |
| } |
| } |
| } |