| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.wayang.spark.operators; |
| |
| import java.util.Collection; |
| import org.apache.spark.api.java.JavaPairRDD; |
| import org.apache.spark.api.java.JavaRDD; |
| import org.apache.wayang.core.optimizer.OptimizationContext; |
| import org.apache.wayang.core.plan.wayangplan.ExecutionOperator; |
| import org.apache.wayang.core.platform.ChannelInstance; |
| import org.apache.wayang.core.platform.lineage.ExecutionLineageNode; |
| import org.apache.wayang.core.util.Tuple; |
| import org.apache.wayang.spark.execution.SparkExecutor; |
| import org.apache.wayang.spark.platform.SparkPlatform; |
| |
| /** |
| * Execution operator for the {@link SparkPlatform}. |
| */ |
| public interface SparkExecutionOperator extends ExecutionOperator { |
| |
| @Override |
| default SparkPlatform getPlatform() { |
| return SparkPlatform.getInstance(); |
| } |
| |
| /** |
| * Evaluates this operator. Takes a set of {@link ChannelInstance}s according to the operator inputs and manipulates |
| * a set of {@link ChannelInstance}s according to the operator outputs -- unless the operator is a sink, then it triggers |
| * execution. |
| * <p>In addition, this method should give feedback of what this instance was doing by wiring the |
| * {@link org.apache.wayang.core.platform.lineage.LazyExecutionLineageNode}s of input and ouput {@link ChannelInstance}s and |
| * providing a {@link Collection} of executed {@link ExecutionLineageNode}s.</p> |
| * |
| * @param inputs {@link ChannelInstance}s that satisfy the inputs of this operator |
| * @param outputs {@link ChannelInstance}s that accept the outputs of this operator |
| * @param sparkExecutor {@link SparkExecutor} that executes this instance |
| * @param operatorContext optimization information for this instance |
| * @return {@link Collection}s of what has been executed and produced |
| */ |
| Tuple<Collection<ExecutionLineageNode>, Collection<ChannelInstance>> evaluate( |
| ChannelInstance[] inputs, |
| ChannelInstance[] outputs, |
| SparkExecutor sparkExecutor, |
| OptimizationContext.OperatorContext operatorContext); |
| |
| /** |
| * Tell whether this instances is a Spark action. This is important to keep track on when Spark is actually |
| * initialized. |
| * |
| * @return whether this instance issues Spark actions |
| */ |
| boolean containsAction(); |
| |
| /** |
| * Utility method to name an RDD according to this instance's name. |
| * |
| * @param rdd that should be renamed |
| * @see #getName() |
| */ |
| default void name(JavaRDD<?> rdd) { |
| if (this.getName() != null) { |
| rdd.setName(this.getName()); |
| } else { |
| rdd.setName(this.toString()); |
| } |
| } |
| |
| /** |
| * Utility method to name an RDD according to this instance's name. |
| * |
| * @param rdd that should be renamed |
| * @see #getName() |
| */ |
| default void name(JavaPairRDD<?, ?> rdd) { |
| if (this.getName() != null) { |
| rdd.setName(this.getName()); |
| } else { |
| rdd.setName(this.toString()); |
| } |
| } |
| |
| } |