blob: c2bcbbf02838c8075f38577e1a571bf68380ae43 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.sysds.test.functions.quaternary;
import java.util.HashMap;
import org.junit.AfterClass;
import org.junit.Assert;
import org.junit.BeforeClass;
import org.junit.Test;
import org.apache.sysds.api.DMLScript;
import org.apache.sysds.common.Types.ExecMode;
import org.apache.sysds.hops.OptimizerUtils;
import org.apache.sysds.hops.QuaternaryOp;
import org.apache.sysds.lops.WeightedSquaredLoss;
import org.apache.sysds.lops.WeightedSquaredLossR;
import org.apache.sysds.lops.LopProperties.ExecType;
import org.apache.sysds.runtime.instructions.Instruction;
import org.apache.sysds.runtime.matrix.data.MatrixValue.CellIndex;
import org.apache.sysds.runtime.meta.MatrixCharacteristics;
import org.apache.sysds.test.AutomatedTestBase;
import org.apache.sysds.test.TestConfiguration;
import org.apache.sysds.test.TestUtils;
import org.apache.sysds.utils.Statistics;
/**
 * Tests for the weighted squared loss quaternary operation.
 *
 * Every test case generates random inputs X, U and V (plus W for all scripts
 * except {@code WeightedSquaredLossNo}), executes the selected DML script and
 * the R script of the same name, and compares the 1x1 output {@code R} of
 * both runs. If algebraic rewrites are enabled, the heavy-hitter statistics
 * are additionally checked for the expected weighted squared loss opcode.
 */
public class WeightedSquaredLossTest extends AutomatedTestBase
{
    private static final String TEST_NAME1 = "WeightedSquaredLossPost";
    private static final String TEST_NAME2 = "WeightedSquaredLossPre";
    private static final String TEST_NAME3 = "WeightedSquaredLossNo";
    private static final String TEST_NAME4 = "WeightedSquaredLossPost2";
    private static final String TEST_NAME5 = "WeightedSquaredLossPre2";
    private static final String TEST_NAME6 = "WeightedSquaredLossNo2";
    private static final String TEST_NAME7 = "WeightedSquaredLossPostNz";

    private static final String TEST_DIR = "functions/quaternary/";
    private static final String TEST_CLASS_DIR = TEST_DIR + WeightedSquaredLossTest.class.getSimpleName() + "/";

    /** Tolerance used when comparing the DML result against the R result. */
    private static final double EPS = 1e-6;

    /** Dimensions of X and W (ROWS x COLS); U is ROWS x RANK and V is COLS x RANK. */
    private static final int ROWS = 1201;
    private static final int COLS = 1103;
    private static final int RANK = 10;

    /** Sparsity of X and W in the sparse and dense test variants. */
    private static final double SPARSITY_SPARSE = 0.001;
    private static final double SPARSITY_DENSE = 0.6;

    @Override
    public void setUp()
    {
        // every script writes a single output named "R"
        final String[] scripts = {
            TEST_NAME1, TEST_NAME2, TEST_NAME3, TEST_NAME4, TEST_NAME5, TEST_NAME6, TEST_NAME7
        };
        for (String script : scripts) {
            addTestConfiguration(script, new TestConfiguration(TEST_CLASS_DIR, script, new String[]{"R"}));
        }

        if (TEST_CACHE_ENABLED) {
            setOutAndExpectedDeletionDisabled(true);
        }
    }

    @BeforeClass
    public static void init()
    {
        TestUtils.clearDirectory(TEST_DATA_DIR + TEST_CLASS_DIR);
    }

    @AfterClass
    public static void cleanUp()
    {
        if (TEST_CACHE_ENABLED) {
            TestUtils.clearDirectory(TEST_DATA_DIR + TEST_CLASS_DIR);
        }
    }

    // ---- CP, rewrites disabled ----

    @Test
    public void testSquaredLossDensePostWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, false, false, ExecType.CP);
    }

    @Test
    public void testSquaredLossDensePreWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, false, false, ExecType.CP);
    }

    @Test
    public void testSquaredLossDenseNoWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, false, false, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparsePostWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, true, false, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparsePreWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, true, false, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparseNoWeightsNoRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, true, false, ExecType.CP);
    }

    // ---- CP, rewrites enabled ----

    @Test
    public void testSquaredLossDensePostWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossDensePreWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossDenseNoWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparsePostWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, true, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparsePreWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, true, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparseNoWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, true, true, ExecType.CP);
    }

    // ---- Spark, rewrites enabled ----

    @Test
    public void testSquaredLossDensePostWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, false, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDensePreWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, false, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDenseNoWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, false, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparsePostWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparsePreWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparseNoWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, true, true, ExecType.SPARK);
    }

    // ---- PostNz script, rewrites enabled ----

    @Test
    public void testSquaredLossDensePostNzWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossSparsePostNzWeightsRewritesCP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, true, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossDensePostNzWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, false, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparsePostNzWeightsRewritesSP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, true, true, ExecType.SPARK);
    }

    // The following tests force the replication-based operator (via
    // QuaternaryOp.FORCE_REPLICATION) because otherwise we would always
    // choose broadcasts for this small input data.

    @Test
    public void testSquaredLossSparsePostWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, true, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparsePreWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, true, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparseNoWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, true, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDensePostWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME1, false, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDensePreWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME2, false, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDenseNoWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME3, false, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossSparsePostNzWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, true, true, true, ExecType.SPARK);
    }

    @Test
    public void testSquaredLossDensePostNzWeightsRewritesRepSP()
    {
        runWeightedSquaredLossTest(TEST_NAME7, false, true, true, ExecType.SPARK);
    }

    // The following tests use a slightly different pattern of U%*%t(V)-X,
    // which applies as well due to the subsequent squaring.

    @Test
    public void testSquaredLossDensePostWeightsRewrites2CP()
    {
        runWeightedSquaredLossTest(TEST_NAME4, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossDensePreWeightsRewrites2CP()
    {
        runWeightedSquaredLossTest(TEST_NAME5, false, true, ExecType.CP);
    }

    @Test
    public void testSquaredLossDenseNoWeightsRewrites2CP()
    {
        runWeightedSquaredLossTest(TEST_NAME6, false, true, ExecType.CP);
    }

    /**
     * Runs a single test case without forcing the replication-based operator.
     *
     * @param testname name of the DML/R script pair to execute
     * @param sparse   if true, X and W are generated with the sparse sparsity, otherwise with the dense one
     * @param rewrites value assigned to {@code OptimizerUtils.ALLOW_ALGEBRAIC_SIMPLIFICATION} for this run
     * @param instType execution type; SPARK selects the Spark execution mode, anything else the hybrid mode
     */
    private void runWeightedSquaredLossTest(String testname, boolean sparse, boolean rewrites, ExecType instType)
    {
        runWeightedSquaredLossTest(testname, sparse, rewrites, false, instType);
    }

    /**
     * Runs a single test case: configures the global execution flags, generates
     * the inputs, executes the DML and R scripts, compares their results and,
     * if rewrites are enabled, verifies the expected opcode in the statistics.
     * All modified global flags are restored afterwards.
     *
     * @param testname name of the DML/R script pair to execute
     * @param sparse   if true, X and W are generated with the sparse sparsity, otherwise with the dense one
     * @param rewrites value assigned to {@code OptimizerUtils.ALLOW_ALGEBRAIC_SIMPLIFICATION} for this run
     * @param rep      value assigned to {@code QuaternaryOp.FORCE_REPLICATION} for this run
     * @param instType execution type; SPARK selects the Spark execution mode, anything else the hybrid mode
     */
    private void runWeightedSquaredLossTest(String testname, boolean sparse, boolean rewrites, boolean rep, ExecType instType)
    {
        // remember the global state that is modified below
        final ExecMode savedPlatform = rtplatform;
        final boolean savedSparkConfig = DMLScript.USE_LOCAL_SPARK_CONFIG;
        final boolean savedRewrites = OptimizerUtils.ALLOW_ALGEBRAIC_SIMPLIFICATION;
        final boolean savedForceRep = QuaternaryOp.FORCE_REPLICATION;

        switch (instType) {
            case SPARK:
                rtplatform = ExecMode.SPARK;
                break;
            default:
                rtplatform = ExecMode.HYBRID;
                break;
        }
        if (rtplatform == ExecMode.SPARK) {
            DMLScript.USE_LOCAL_SPARK_CONFIG = true;
        }
        OptimizerUtils.ALLOW_ALGEBRAIC_SIMPLIFICATION = rewrites;
        QuaternaryOp.FORCE_REPLICATION = rep;

        try
        {
            final double sparsity = sparse ? SPARSITY_SPARSE : SPARSITY_DENSE;

            // with caching enabled, each script/sparsity combination gets its own cache directory
            final TestConfiguration config = getTestConfiguration(testname);
            final String cacheDir = TEST_CACHE_ENABLED ? (testname + "_" + sparsity + "/") : "";
            loadTestConfiguration(config, cacheDir);

            // construct the script arguments directly
            final String scriptPrefix = SCRIPT_DIR + TEST_DIR + testname;
            fullDMLScriptName = scriptPrefix + ".dml";
            programArgs = new String[] {
                "-stats", "-explain", "runtime", "-args",
                input("X"), input("U"), input("V"), input("W"), output("R")
            };
            fullRScriptName = scriptPrefix + ".R";
            rCmd = "Rscript " + fullRScriptName + " " + inputDir() + " " + expectedDir();

            // generate the input data with fixed seeds
            writeInputMatrixWithMTD("X", getRandomMatrix(ROWS, COLS, 0, 1, sparsity, 7), true);
            writeInputMatrixWithMTD("U", getRandomMatrix(ROWS, RANK, 0, 1, 1.0, 213), true);
            writeInputMatrixWithMTD("V", getRandomMatrix(COLS, RANK, 0, 1, 1.0, 312), true);
            if (!testname.equals(TEST_NAME3)) {
                writeInputMatrixWithMTD("W", getRandomMatrix(ROWS, COLS, 0, 1, sparsity, 1467), true);
            }

            runTest(true, false, null, -1);
            runRScript(true);

            // compare the DML output against the R output
            final HashMap<CellIndex, Double> dmlResult = readDMLMatrixFromOutputDir("R");
            final HashMap<CellIndex, Double> rResult = readRMatrixFromExpectedDir("R");
            TestUtils.compareMatrices(dmlResult, rResult, EPS, "Stat-DML", "Stat-R");
            checkDMLMetaDataFile("R", new MatrixCharacteristics(1,1,1,1));

            // with rewrites enabled, the fused operator must show up in the statistics
            if (rewrites) {
                if (instType == ExecType.CP) {
                    assertRewriteApplied(WeightedSquaredLoss.OPCODE_CP);
                }
                else if (instType == ExecType.SPARK) {
                    final boolean noWeights = isNoWeightsScript(testname);
                    // the non-R opcode is only expected for these scripts when replication is not forced
                    final boolean expectPlainOpcode = !rep && noWeights;
                    final String baseOpcode = expectPlainOpcode
                        ? WeightedSquaredLoss.OPCODE
                        : WeightedSquaredLossR.OPCODE;
                    assertRewriteApplied(Instruction.SP_INST_PREFIX + baseOpcode);
                }
            }
        }
        finally
        {
            // restore the global state
            QuaternaryOp.FORCE_REPLICATION = savedForceRep;
            OptimizerUtils.ALLOW_ALGEBRAIC_SIMPLIFICATION = savedRewrites;
            DMLScript.USE_LOCAL_SPARK_CONFIG = savedSparkConfig;
            rtplatform = savedPlatform;
        }
    }

    /**
     * Tells whether the given script is one of the three (No, No2, PostNz)
     * that the Spark opcode check treats as "no weights".
     *
     * @param testname name of the script under test
     * @return true for TEST_NAME3, TEST_NAME6 and TEST_NAME7, false otherwise
     */
    private static boolean isNoWeightsScript(String testname)
    {
        return testname.equals(TEST_NAME3)
            || testname.equals(TEST_NAME6)
            || testname.equals(TEST_NAME7);
    }

    /**
     * Asserts that the given opcode is contained in the heavy-hitter opcodes
     * reported by the statistics.
     *
     * @param opcode opcode expected among the heavy hitters
     */
    private static void assertRewriteApplied(String opcode)
    {
        Assert.assertTrue("Rewrite not applied.", Statistics.getCPHeavyHitterOpCodes().contains(opcode));
    }
}