blob: 6135d45d203386aa7b06f6f1b53492a46a0e15e4 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.sysds.runtime.instructions.spark;
import org.apache.spark.api.java.JavaPairRDD;
import org.apache.spark.api.java.function.Function;
import org.apache.sysds.runtime.controlprogram.context.ExecutionContext;
import org.apache.sysds.runtime.controlprogram.context.SparkExecutionContext;
import org.apache.sysds.runtime.instructions.cp.CPOperand;
import org.apache.sysds.runtime.instructions.spark.data.PartitionedBroadcast;
import org.apache.sysds.runtime.matrix.data.FrameBlock;
import org.apache.sysds.runtime.matrix.data.MatrixBlock;
import org.apache.sysds.runtime.matrix.operators.Operator;
public class BinaryFrameMatrixSPInstruction extends BinarySPInstruction {
protected BinaryFrameMatrixSPInstruction(Operator op, CPOperand in1, CPOperand in2, CPOperand out, String opcode, String istr) {
super(SPType.Binary, op, in1, in2, out, opcode, istr);
}
@Override
public void processInstruction(ExecutionContext ec) {
SparkExecutionContext sec = (SparkExecutionContext) ec;
// Get input RDDs
JavaPairRDD<Long, FrameBlock> in1 = sec.getFrameBinaryBlockRDDHandleForVariable(input1.getName());
// get feature length matrix
PartitionedBroadcast<MatrixBlock> feaLen = sec.getBroadcastForVariable(input2.getName());
JavaPairRDD<Long, FrameBlock> out = in1.mapValues(new DropInvalidLengths(feaLen));
//set output RDD
sec.setRDDHandleForVariable(output.getName(), out);
sec.addLineageRDD(output.getName(), input1.getName());
sec.addLineageBroadcast(output.getName(), input2.getName());
}
private static class DropInvalidLengths implements Function<FrameBlock,FrameBlock> {
private static final long serialVersionUID = 5850400295183766400L;
private PartitionedBroadcast<MatrixBlock> featureLength = null;
public DropInvalidLengths(PartitionedBroadcast<MatrixBlock> fl) {
featureLength = fl;
}
@Override public FrameBlock call(FrameBlock frameBlock) throws Exception {
int idx = (int)featureLength.getNumRows();
FrameBlock fb = frameBlock.invalidByLength(featureLength.getBlock(1, idx));
return fb;
}
}
}