/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.nemo.compiler.frontend.spark.core.rdd;

import org.apache.nemo.common.dag.DAG;
import org.apache.nemo.common.dag.DAGBuilder;
import org.apache.nemo.common.ir.edge.IREdge;
import org.apache.nemo.common.ir.vertex.IRVertex;
import org.apache.nemo.common.ir.vertex.InMemorySourceVertex;
import org.apache.nemo.common.ir.vertex.executionproperty.ParallelismProperty;
import org.apache.nemo.compiler.frontend.spark.core.SparkFrontendUtils;
import org.apache.nemo.compiler.frontend.spark.source.SparkDatasetBoundedSourceVertex;
import org.apache.nemo.compiler.frontend.spark.source.SparkTextFileBoundedSourceVertex;
import org.apache.nemo.compiler.frontend.spark.sql.Dataset;
import org.apache.nemo.compiler.frontend.spark.sql.SparkSession;
import org.apache.spark.Partition;
import org.apache.spark.Partitioner;
import org.apache.spark.SparkContext;
import org.apache.spark.TaskContext;
import org.apache.spark.api.java.JavaFutureAction;
import org.apache.spark.api.java.Optional;
import org.apache.spark.api.java.function.*;
import org.apache.spark.partial.BoundedDouble;
import org.apache.spark.partial.PartialResult;
import org.apache.spark.storage.StorageLevel;
import scala.Option;
import scala.Tuple2;
import scala.reflect.ClassTag$;
import java.util.Comparator;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.concurrent.atomic.AtomicInteger;

/**
* Java RDD wrapping a Nemo {@link RDD}.
*
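* <p>A minimal end-to-end sketch; {@code sc} stands for an assumed,
* already-configured {@link SparkContext}:
* <pre>{@code
* SparkJavaRDD<Integer> numbers =
*     SparkJavaRDD.of(sc, java.util.Arrays.asList(1, 2, 3), 1);
* Integer sum = numbers.map(i -> i * 2).reduce((a, b) -> a + b);
* }</pre>
*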
* @param <T> type of the final element.
*/
public final class SparkJavaRDD<T> extends org.apache.spark.api.java.JavaRDD<T> {
private final RDD<T> rdd;
private static final String NOT_YET_SUPPORTED = "Operation not yet supported.";
/**
* Static method to create a SparkJavaRDD object from an iterable.
*
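* <p>A minimal usage sketch; {@code sc} is an assumed, pre-configured
* {@link SparkContext}:
* <pre>{@code
* SparkJavaRDD<String> letters =
*     SparkJavaRDD.of(sc, java.util.Arrays.asList("a", "b", "c"), 2);
* }</pre>
*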
* @param sparkContext Spark context containing configurations.
* @param initialData initial data.
* @param parallelism parallelism information.
* @param <T> type of the resulting object.
* @return the new SparkJavaRDD object.
*/
public static <T> SparkJavaRDD<T> of(final SparkContext sparkContext,
final Iterable<T> initialData,
final Integer parallelism) {
final DAGBuilder<IRVertex, IREdge> builder = new DAGBuilder<>();
final IRVertex initializedSourceVertex = new InMemorySourceVertex<>(initialData);
initializedSourceVertex.setProperty(ParallelismProperty.of(parallelism));
builder.addVertex(initializedSourceVertex);
final RDD<T> nemoRdd = new RDD<>(sparkContext, builder.buildWithoutSourceSinkCheck(),
initializedSourceVertex, Option.empty(), ClassTag$.MODULE$.apply(Object.class));
return new SparkJavaRDD<>(nemoRdd);
}
/**
* Static method to create a SparkJavaRDD object from a text file.
*
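* <p>For example, with an assumed {@code sc} and an illustrative input path:
* <pre>{@code
* SparkJavaRDD<String> lines = SparkJavaRDD.of(sc, 4, "hdfs:///data/input.txt");
* }</pre>
*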
* @param sparkContext the Spark context containing configurations.
* @param minPartitions the minimum number of partitions.
* @param inputPath the path of the input text file.
* @return the new SparkJavaRDD object.
*/
public static SparkJavaRDD<String> of(final SparkContext sparkContext,
final int minPartitions,
final String inputPath) {
final DAGBuilder<IRVertex, IREdge> builder = new DAGBuilder<>();
final org.apache.spark.rdd.RDD<String> textRdd = sparkContext.textFile(inputPath, minPartitions);
final int numPartitions = textRdd.getNumPartitions();
final IRVertex textSourceVertex = new SparkTextFileBoundedSourceVertex(sparkContext, inputPath, numPartitions);
textSourceVertex.setProperty(ParallelismProperty.of(numPartitions));
builder.addVertex(textSourceVertex);
return new SparkJavaRDD<>(textRdd, sparkContext, builder.buildWithoutSourceSinkCheck(), textSourceVertex);
}
/**
* Static method to create a SparkJavaRDD object from a Dataset.
*
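* <p>For example, assuming an existing Nemo {@link SparkSession} named
* {@code spark} whose reader mirrors Spark's {@code read().textFile} API:
* <pre>{@code
* Dataset<String> dataset = spark.read().textFile("input.txt");
* SparkJavaRDD<String> rdd = SparkJavaRDD.of(spark, dataset);
* }</pre>
*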
* @param sparkSession Spark session containing configurations.
* @param dataset dataset to read initial data from.
* @param <T> type of the resulting object.
* @return the new SparkJavaRDD object.
*/
public static <T> SparkJavaRDD<T> of(final SparkSession sparkSession,
final Dataset<T> dataset) {
final DAGBuilder<IRVertex, IREdge> builder = new DAGBuilder<>();
final IRVertex sparkBoundedSourceVertex = new SparkDatasetBoundedSourceVertex<>(sparkSession, dataset);
final org.apache.spark.rdd.RDD<T> sparkRDD = dataset.sparkRDD();
sparkBoundedSourceVertex.setProperty(ParallelismProperty.of(sparkRDD.getNumPartitions()));
builder.addVertex(sparkBoundedSourceVertex);
return new SparkJavaRDD<>(
sparkRDD, sparkSession.sparkContext(), builder.buildWithoutSourceSinkCheck(), sparkBoundedSourceVertex);
}
/**
* Static method to create a SparkJavaRDD object from a Nemo {@link RDD}.
*
* @param rddFrom the Nemo RDD to wrap.
* @param <T> type of the resulting object.
* @return the wrapping SparkJavaRDD object.
*/
public static <T> SparkJavaRDD<T> fromRDD(final RDD<T> rddFrom) {
return new SparkJavaRDD<>(rddFrom);
}
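/**
* Wraps a Nemo {@link RDD} as a SparkJavaRDD; plain Spark RDDs are rejected,
* since only Nemo RDDs carry the IR DAG under construction.
*
* @param rddFrom the RDD to wrap; must be a Nemo {@link RDD}.
* @return the wrapping SparkJavaRDD.
*/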
@Override
public SparkJavaRDD<T> wrapRDD(final org.apache.spark.rdd.RDD<T> rddFrom) {
if (!(rddFrom instanceof RDD)) {
throw new UnsupportedOperationException("Cannot wrap Spark RDD as Nemo RDD!");
}
return fromRDD((RDD<T>) rddFrom);
}
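/**
* @return the underlying Nemo {@link RDD}.
*/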
@Override
public RDD<T> rdd() {
return rdd;
}
/**
* Constructor from an existing Nemo RDD.
*
* @param rdd the Nemo RDD to wrap.
*/
SparkJavaRDD(final RDD<T> rdd) {
super(rdd, ClassTag$.MODULE$.apply(Object.class));
this.rdd = rdd;
}
/**
* Constructor from a Spark source RDD.
*
* @param sparkRDD the Spark source RDD to wrap.
* @param sparkContext the Spark context of the wrapped RDD.
* @param dag the IR DAG in construction.
* @param lastVertex the last vertex of the DAG in construction.
*/
SparkJavaRDD(final org.apache.spark.rdd.RDD<T> sparkRDD,
final SparkContext sparkContext,
final DAG<IRVertex, IREdge> dag,
final IRVertex lastVertex) {
super(sparkRDD, ClassTag$.MODULE$.apply(Object.class));
this.rdd = new RDD<>(sparkContext, dag, lastVertex, Option.apply(sparkRDD), ClassTag$.MODULE$.apply(Object.class));
}
/////////////// TRANSFORMATIONS ///////////////
/**
* Map transform.
*
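* <p>For example, doubling each element of a hypothetical
* {@code SparkJavaRDD<Integer>} named {@code numbers}:
* <pre>{@code
* SparkJavaRDD<Integer> doubled = numbers.map(i -> i * 2);
* }</pre>
*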
* @param func function to apply.
* @param <O> output type.
* @return the SparkJavaRDD with the extended DAG.
*/
@Override
public <O> SparkJavaRDD<O> map(final Function<T, O> func) {
return rdd.map(func, ClassTag$.MODULE$.apply(Object.class)).toJavaRDD();
}
/**
* Flat map transform.
*
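* <p>For example, splitting a hypothetical {@code SparkJavaRDD<String>} of
* text lines into words:
* <pre>{@code
* SparkJavaRDD<String> words =
*     lines.flatMap(line -> java.util.Arrays.asList(line.split(" ")).iterator());
* }</pre>
*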
* @param func function to apply.
* @param <O> output type.
* @return the SparkJavaRDD with the extended DAG.
*/
@Override
public <O> SparkJavaRDD<O> flatMap(final FlatMapFunction<T, O> func) {
return rdd.flatMap(func, ClassTag$.MODULE$.apply(Object.class)).toJavaRDD();
}
/////////////// TRANSFORMATION TO PAIR RDD ///////////////
/**
* @see org.apache.spark.api.java.JavaRDD#mapToPair(PairFunction)
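*
* <p>For example, pairing each word of a hypothetical
* {@code SparkJavaRDD<String>} with a count of one:
* <pre>{@code
* SparkJavaPairRDD<String, Integer> ones =
*     words.mapToPair(word -> new Tuple2<>(word, 1));
* }</pre>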
*/
@Override
public <K2, V2> SparkJavaPairRDD<K2, V2> mapToPair(final PairFunction<T, K2, V2> f) {
final RDD<Tuple2<K2, V2>> pairRdd =
rdd.map(SparkFrontendUtils.pairFunctionToPlainFunction(f), ClassTag$.MODULE$.apply(Object.class));
return SparkJavaPairRDD.fromRDD(pairRdd);
}
/////////////// ACTIONS ///////////////
private static final AtomicInteger RESULT_ID = new AtomicInteger(0);
/**
* This method is to be removed after a result handler is implemented.
*
* @return a unique integer.
*/
public static Integer getResultId() {
return RESULT_ID.getAndIncrement();
}
/**
* Reduce action.
*
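* <p>For example, summing a hypothetical {@code SparkJavaRDD<Integer>}:
* <pre>{@code
* Integer sum = numbers.reduce((a, b) -> a + b);
* }</pre>
*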
* @param func function (binary operator) to apply.
* @return the result of the reduce action.
*/
@Override
public T reduce(final Function2<T, T, T> func) {
return rdd.reduce(func);
}
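/**
* Collect action: computes this RDD and returns its elements to the driver
* as a list.
*
* @return the collected list of elements.
*/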
@Override
public List<T> collect() {
return rdd.collectAsList();
}
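/**
* Save-as-text-file action: writes the elements of this RDD as text files
* under the given path.
*
* @param path the path of the output directory.
*/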
@Override
public void saveAsTextFile(final String path) {
rdd.saveAsTextFile(path);
}
/////////////// CACHING ///////////////
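/**
* Marks this RDD to be persisted with the given storage level.
*
* @param newLevel the storage level to persist with.
* @return the SparkJavaRDD marked for persistence.
*/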
@Override
public SparkJavaRDD<T> persist(final StorageLevel newLevel) {
return rdd.persist(newLevel).toJavaRDD();
}
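/**
* Marks this RDD to be cached with the default storage level.
*
* @return the SparkJavaRDD marked for caching.
*/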
@Override
public SparkJavaRDD<T> cache() {
return rdd.cache().toJavaRDD();
}
/**
* TODO#92: Implement the unimplemented transformations/actions & dataset initialization methods for Spark frontend.
*/
@Override
public SparkJavaRDD<T> coalesce(final int numPartitions) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> coalesce(final int numPartitions, final boolean shuffle) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> distinct() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> distinct(final int numPartitions) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> filter(final Function<T, Boolean> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<List<T>> glom() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> SparkJavaRDD<U> mapPartitions(final FlatMapFunction<Iterator<T>, U> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> SparkJavaRDD<U> mapPartitions(final FlatMapFunction<Iterator<T>, U> f,
final boolean preservesPartitioning) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <R> SparkJavaRDD<R> mapPartitionsWithIndex(final Function2<Integer, Iterator<T>, Iterator<R>> f,
final boolean preservesPartitioning) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T>[] randomSplit(final double[] weights) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T>[] randomSplit(final double[] weights, final long seed) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> repartition(final int numPartitions) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> sample(final boolean withReplacement, final double fraction) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> sample(final boolean withReplacement, final double fraction, final long seed) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> setName(final String name) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <S> SparkJavaRDD<T> sortBy(final Function<T, S> f, final boolean ascending, final int numPartitions) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> unpersist() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaRDD<T> unpersist(final boolean blocking) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <K2, V2> SparkJavaPairRDD<K2, V2> flatMapToPair(final PairFlatMapFunction<T, K2, V2> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> SparkJavaPairRDD<U, Iterable<T>> groupBy(final Function<T, U> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> SparkJavaPairRDD<U, Iterable<T>> groupBy(final Function<T, U> f, final int numPartitions) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> SparkJavaPairRDD<U, T> keyBy(final Function<T, U> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <K2, V2> SparkJavaPairRDD<K2, V2> mapPartitionsToPair(final PairFlatMapFunction<Iterator<T>, K2, V2> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <K2, V2> SparkJavaPairRDD<K2, V2> mapPartitionsToPair(
final PairFlatMapFunction<Iterator<T>, K2, V2> f,
final boolean preservesPartitioning) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaPairRDD<T, Long> zipWithIndex() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public SparkJavaPairRDD<T, Long> zipWithUniqueId() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
/////////////// ACTIONS ///////////////
@Override
public <U> U aggregate(final U zeroValue, final Function2<U, T, U> seqOp, final Function2<U, U, U> combOp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public void checkpoint() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public JavaFutureAction<List<T>> collectAsync() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T>[] collectPartitions(final int[] partitionIds) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public long count() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public PartialResult<BoundedDouble> countApprox(final long timeout) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public PartialResult<BoundedDouble> countApprox(final long timeout, final double confidence) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public long countApproxDistinct(final double relativeSD) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public JavaFutureAction<Long> countAsync() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public Map<T, Long> countByValue() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public PartialResult<Map<T, BoundedDouble>> countByValueApprox(final long timeout) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public PartialResult<Map<T, BoundedDouble>> countByValueApprox(final long timeout, final double confidence) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T first() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T fold(final T zeroValue, final Function2<T, T, T> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public void foreach(final VoidFunction<T> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public JavaFutureAction<Void> foreachAsync(final VoidFunction<T> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public void foreachPartition(final VoidFunction<Iterator<T>> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public JavaFutureAction<Void> foreachPartitionAsync(final VoidFunction<Iterator<T>> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public Optional<String> getCheckpointFile() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public int getNumPartitions() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public StorageLevel getStorageLevel() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public int id() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public boolean isCheckpointed() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public boolean isEmpty() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public Iterator<T> iterator(final Partition split, final TaskContext taskContext) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T max(final Comparator<T> comp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T min(final Comparator<T> comp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public String name() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public Optional<Partitioner> partitioner() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<Partition> partitions() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public void saveAsObjectFile(final String path) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public void saveAsTextFile(final String path,
final Class<? extends org.apache.hadoop.io.compress.CompressionCodec> codec) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> take(final int num) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public JavaFutureAction<List<T>> takeAsync(final int num) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> takeOrdered(final int num) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> takeOrdered(final int num, final Comparator<T> comp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> takeSample(final boolean withReplacement, final int num) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> takeSample(final boolean withReplacement, final int num, final long seed) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public String toDebugString() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public Iterator<T> toLocalIterator() {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> top(final int num) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public List<T> top(final int num, final Comparator<T> comp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> U treeAggregate(final U zeroValue, final Function2<U, T, U> seqOp, final Function2<U, U, U> combOp) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public <U> U treeAggregate(final U zeroValue, final Function2<U, T, U> seqOp,
final Function2<U, U, U> combOp, final int depth) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T treeReduce(final Function2<T, T, T> f) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
@Override
public T treeReduce(final Function2<T, T, T> f, final int depth) {
throw new UnsupportedOperationException(NOT_YET_SUPPORTED);
}
}