/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/

package org.apache.sysds.runtime.controlprogram.parfor;

import org.apache.hadoop.io.Writable;
import org.apache.spark.TaskContext;
import org.apache.spark.api.java.function.PairFlatMapFunction;
import org.apache.spark.util.LongAccumulator;
import org.apache.sysds.common.Types.FileFormat;
import org.apache.sysds.runtime.DMLRuntimeException;
import org.apache.sysds.runtime.codegen.CodegenUtils;
import org.apache.sysds.runtime.controlprogram.ParForProgramBlock.PDataPartitionFormat;
import org.apache.sysds.runtime.controlprogram.ParForProgramBlock.PartitionFormat;
import org.apache.sysds.runtime.controlprogram.caching.CacheableData;
import org.apache.sysds.runtime.controlprogram.caching.MatrixObject;
import org.apache.sysds.runtime.controlprogram.parfor.Task.TaskType;
import org.apache.sysds.runtime.controlprogram.parfor.stat.InfrastructureAnalyzer;
import org.apache.sysds.runtime.controlprogram.parfor.util.PairWritableBlock;
import org.apache.sysds.runtime.controlprogram.parfor.util.PairWritableCell;
import org.apache.sysds.runtime.instructions.cp.IntObject;
import org.apache.sysds.runtime.matrix.data.MatrixBlock;
import org.apache.sysds.runtime.meta.DataCharacteristics;
import org.apache.sysds.runtime.util.ProgramConverter;
import scala.Tuple2;
import java.io.IOException;
import java.util.Collection;
import java.util.HashMap;
import java.util.Iterator;
import java.util.Map.Entry;
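
/**
 * Remote spark parfor worker for fused data partitioning and execution:
 * for each input data partition (keyed by the corresponding parfor
 * iteration), it assembles the partition fragments into an in-memory
 * matrix partition, binds it to the partitioned input variable, and
 * executes the parfor body program for that iteration. The returned
 * (workerID, result) pairs carry the exported result variables.
 */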
public class RemoteDPParForSparkWorker extends ParWorker implements PairFlatMapFunction<Iterator<Tuple2<Long, Iterable<Writable>>>, Long, String>
{
private static final long serialVersionUID = 30223759283155139L;
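
//serialized parfor body program, generated codegen classes, and caching flag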
private final String _prog;
private final HashMap<String, byte[]> _clsMap;
private final boolean _caching;
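
//input meta data (partitioned input variable, iteration variable, file format)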
private final String _inputVar;
private final String _iterVar;
private final FileFormat _fmt;
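
//matrix partition meta data (dimensions, block size, and partition format)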
private final int _rlen;
private final int _clen;
private final int _blen;
private final boolean _tSparseCol;
private final PDataPartitionFormat _dpf;
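
//spark accumulators for the number of executed tasks and iterations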
private final LongAccumulator _aTasks;
private final LongAccumulator _aIters;

public RemoteDPParForSparkWorker(String program, HashMap<String, byte[]> clsMap, String inputVar, String iterVar,
boolean cpCaching, DataCharacteristics mc, boolean tSparseCol, PartitionFormat dpf, FileFormat fmt,
LongAccumulator atasks, LongAccumulator aiters)
{
_prog = program;
_clsMap = clsMap;
_caching = cpCaching;
_inputVar = inputVar;
_iterVar = iterVar;
_fmt = fmt;
//setup spark accumulators
_aTasks = atasks;
_aIters = aiters;
//setup matrix block partition meta data
_rlen = (int)dpf.getNumRows(mc);
_clen = (int)dpf.getNumColumns(mc);
_blen = mc.getBlocksize();
_tSparseCol = tSparseCol;
_dpf = dpf._dpf;
}

@Override
public Iterator<Tuple2<Long, String>> call(Iterator<Tuple2<Long, Iterable<Writable>>> arg0)
throws Exception
{
//lazy parworker initialization
configureWorker( TaskContext.get().taskAttemptId() );
//process all matrix partitions of this data partition
MatrixBlock partition = null;
while( arg0.hasNext() )
{
Tuple2<Long,Iterable<Writable>> larg = arg0.next();
//collect input partition according to the input file format
if( _fmt == FileFormat.BINARY )
partition = collectBinaryBlock( larg._2(), partition );
else
partition = collectBinaryCellInput( larg._2() );
//update in-memory matrix partition
MatrixObject mo = _ec.getMatrixObject( _inputVar );
mo.setInMemoryPartition( partition );
//create tasks for input data
Task lTask = new Task(_iterVar, TaskType.SET);
lTask.addIteration( new IntObject(larg._1()) );
//execute program
long numIter = getExecutedIterations();
super.executeTask( lTask );
//maintain accumulators
_aTasks.add( 1 );
_aIters.add( getExecutedIterations()-numIter );
}
//export result variables and return (workerID, serialized result var) pairs
return RemoteParForUtils.exportResultVariables(_workerID, _ec.getVariables(), _resultVars)
.stream().map(s -> new Tuple2<>(_workerID, s)).iterator();
}
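
/**
 * Lazily initializes this worker on its first task: registers the
 * generated codegen classes, parses the serialized parfor body program,
 * sets up the local buffer pool, pins the result variables, and
 * disables caching if requested (and not running in local mode).
 *
 * @param ID task attempt id, used as unique worker id
 * @throws IOException if the worker setup fails
 */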
private void configureWorker( long ID )
throws IOException
{
_workerID = ID;
//initialize codegen class cache (before program parsing)
for( Entry<String, byte[]> e : _clsMap.entrySet() )
CodegenUtils.getClassSync(e.getKey(), e.getValue());
//parse and setup parfor body program
ParForBody body = ProgramConverter.parseParForBody(_prog, (int)_workerID, true);
_childBlocks = body.getChildBlocks();
_ec = body.getEc();
_resultVars = body.getResultVariables();
_numTasks = 0;
_numIters = 0;
//setup the buffer pool
RemoteParForUtils.setupBufferPool(_workerID);
//ensure that resultvar files are not removed
super.pinResultVariables();
//enable/disable caching (if required and not in CP process)
if( !_caching && !InfrastructureAnalyzer.isLocalMode() )
CacheableData.disableCaching();
}

/**
 * Collects a matrix block partition from a given input iterator over
 * binary blocks.
 *
 * Note that the given reuse block is modified in place, so multiple
 * calls overwrite previously returned partitions.
 *
 * @param valueList iterable writables
 * @param reuse matrix block partition for reuse
 * @return matrix block
 * @throws IOException if IOException occurs
 */
private MatrixBlock collectBinaryBlock( Iterable<Writable> valueList, MatrixBlock reuse )
throws IOException
{
//fast path for partition of single fragment (see pseudo grouping),
//which avoids unnecessary copies and reduces memory pressure
if( valueList instanceof Collection && ((Collection<Writable>)valueList).size()==1 ) {
return ((PairWritableBlock)valueList.iterator().next()).block;
}
//default: create or reuse target partition and copy individual partition fragments
//into this target, including nnz maintenance and potential dense-sparse format change
MatrixBlock partition = reuse;
try
{
//reset reuse block, keep configured representation
if( _tSparseCol )
partition = new MatrixBlock(_clen, _rlen, true);
else if( partition!=null )
partition.reset(_rlen, _clen, false);
else
partition = new MatrixBlock(_rlen, _clen, false);
long lnnz = 0;
for( Writable val : valueList ) {
PairWritableBlock pval = (PairWritableBlock) val;
int row_offset = (int)(pval.indexes.getRowIndex()-1)*_blen;
int col_offset = (int)(pval.indexes.getColumnIndex()-1)*_blen;
if( !partition.isInSparseFormat() ) //DENSE
partition.copy( row_offset, row_offset+pval.block.getNumRows()-1,
col_offset, col_offset+pval.block.getNumColumns()-1,
pval.block, false );
else //SPARSE
partition.appendToSparse(pval.block, row_offset, col_offset);
lnnz += pval.block.getNonZeros();
}
//post-processing: cleanups if required
if( partition.isInSparseFormat() && _clen>_blen )
partition.sortSparseRows();
partition.setNonZeros(lnnz);
partition.examSparsity();
}
catch(DMLRuntimeException ex) {
throw new IOException(ex);
}
return partition;
}

/**
 * Collects a matrix block partition from a given input iterator over
 * binary cells. In contrast to the binary block case, this method
 * always allocates a new target partition.
 *
 * @param valueList iterable writables
 * @return matrix block
 * @throws IOException if IOException occurs
 */
private MatrixBlock collectBinaryCellInput( Iterable<Writable> valueList )
throws IOException
{
MatrixBlock partition = null;
//reset reuse block, keep configured representation
if( _tSparseCol )
partition = new MatrixBlock(_clen, _rlen, true);
else
partition = new MatrixBlock(_rlen, _clen, false);
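//populate the partition depending on the partition format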
switch( _dpf )
{
case ROW_WISE:
//copy all cells into the single-row partition
for( Writable val : valueList )
{
PairWritableCell pairValue = (PairWritableCell) val;
if( pairValue.indexes.getColumnIndex()<0 )
continue; //cells used to ensure empty partitions
partition.quickSetValue(0, (int)pairValue.indexes.getColumnIndex()-1, pairValue.cell.getValue());
}
break;
case COLUMN_WISE:
//copy all cells into the single-column partition
for( Writable val : valueList )
{
PairWritableCell pairValue = (PairWritableCell) val;
if( pairValue.indexes.getRowIndex()<0 )
continue; //cells used to ensure empty partitions
if( _tSparseCol )
partition.appendValue(0, (int)pairValue.indexes.getRowIndex()-1, pairValue.cell.getValue());
else
partition.quickSetValue((int)pairValue.indexes.getRowIndex()-1, 0, pairValue.cell.getValue());
}
break;
default:
throw new IOException("Partition format not yet supported in fused partition-execute: "+_dpf);
}
//post-processing: cleanups if required
try {
if( partition.isInSparseFormat() && _tSparseCol )
partition.sortSparseRows();
partition.recomputeNonZeros();
partition.examSparsity();
}
catch(DMLRuntimeException ex) {
throw new IOException(ex);
}
return partition;
}
}