| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.sysds.test.functions.builtin; |
| |
| import org.junit.Assert; |
| import org.junit.Test; |
| import org.apache.sysds.common.Types; |
| import org.apache.sysds.common.Types.FileFormat; |
| import org.apache.sysds.lops.LopProperties; |
| import org.apache.sysds.runtime.io.FrameWriter; |
| import org.apache.sysds.runtime.io.FrameWriterFactory; |
| import org.apache.sysds.runtime.matrix.data.FrameBlock; |
| import org.apache.sysds.runtime.util.UtilFunctions; |
| import org.apache.sysds.test.AutomatedTestBase; |
| import org.apache.sysds.test.TestConfiguration; |
| import org.apache.sysds.test.TestUtils; |
| |
| import java.io.IOException; |
| |
| public class BuiltinImputeFDTest extends AutomatedTestBase { |
| |
| private final static String TEST_NAME = "imputeFD"; |
| private final static String TEST_DIR = "functions/builtin/"; |
| private static final String TEST_CLASS_DIR = TEST_DIR + BuiltinImputeFDTest.class.getSimpleName() + "/"; |
| private final static int rows = 11; |
| private final static int cols = 4; |
| private final static double epsilon = 0.0000000001; |
| |
| private final static Types.ValueType[] schema = {Types.ValueType.BOOLEAN, Types.ValueType.STRING, Types.ValueType.STRING, Types.ValueType.FP64}; |
| |
| @Override |
| public void setUp() { |
| TestUtils.clearAssertionInformation(); |
| addTestConfiguration(TEST_NAME, new TestConfiguration(TEST_CLASS_DIR, TEST_NAME, new String[] {"C"})); |
| } |
| |
| @Test |
| public void test1() throws IOException { |
| runImpute_RFDTests(2,3, 0.6, 1, LopProperties.ExecType.CP); |
| } |
| |
| @Test |
| public void test2() throws IOException { |
| runImpute_RFDTests(2,3, 0.45, 2, LopProperties.ExecType.CP); |
| } |
| |
| @Test |
| public void test3() throws IOException { |
| runImpute_RFDTests(2,3, 0.6, 1, LopProperties.ExecType.SPARK); |
| } |
| |
| @Test |
| public void test4() throws IOException { |
| runImpute_RFDTests(2,3, 0.4, 2, LopProperties.ExecType.SPARK); |
| } |
| private void runImpute_RFDTests(int source, int target, double threshold, int test, LopProperties.ExecType instType) |
| throws IOException |
| { |
| Types.ExecMode platformOld = setExecMode(instType); |
| try { |
| loadTestConfiguration(getTestConfiguration(TEST_NAME)); |
| String HOME = SCRIPT_DIR + TEST_DIR; |
| fullDMLScriptName = HOME + TEST_NAME + ".dml"; |
| programArgs = new String[] {"-args", input("A"), String.valueOf(source),String.valueOf(target), String.valueOf(threshold), output("B")}; // |
| //initialize the frame data. |
| FrameBlock frame1 = new FrameBlock(schema); |
| FrameWriter writer = FrameWriterFactory.createFrameWriter(FileFormat.CSV); |
| double[][] A = getRandomMatrix(rows, cols, 0, 1, 0.7, -1); |
| initFrameDataString(frame1, A, test); |
| writer.writeFrameToHDFS(frame1.slice(0, rows - 1, 0, schema.length - 1, new FrameBlock()), |
| input("A"), rows, schema.length); |
| |
| runTest(true, false, null, -1); |
| FrameBlock frameRead = readDMLFrameFromHDFS("B", FileFormat.BINARY); |
| FrameBlock realFrame = tureOutput(A); |
| verifyFrameData(frameRead, realFrame, schema); |
| } |
| finally { |
| rtplatform = platformOld; |
| } |
| } |
| |
| private static void initFrameDataString(FrameBlock frame1, double[][] data, int test) { |
| boolean[] b = new boolean[rows]; |
| long[] l = new long[rows]; |
| String[] s1 = null, s2 = null; |
| for (int i = 0; i < rows; i++) { |
| data[i][1] = (b[i] = (Boolean) UtilFunctions.doubleToObject(Types.ValueType.BOOLEAN, data[i][1], false)) ? 1 : 0; |
| l[i] = (Long) UtilFunctions.doubleToObject(Types.ValueType.INT64, data[i][2], false); |
| } |
| switch (test) |
| { |
| case 1: |
| s1 = new String[] {"TU-Graz", "TU-Graz", "TU-Graz", "IIT", "IIT", "IIT", "IIT", "SIBA", "SIBA", "SIBA", "TU-Wien"}; |
| s2 = new String[] {"Austria", "Austria", "Austria", "India", "IIT", "India", "India", "Pakistan", "Pakistan", "Austria", "Austria"}; |
| break; |
| case 2: |
| s1 = new String[] {"TU-Graz", "TU-Graz", "TU-Graz", "IIT", "IIT", "IIT", "IIT", "SIBA", "SIBA", "SIBA", "TU-Wien"}; |
| s2 = new String[] {"Austria", "Austria", "Austria", "India", "IIT", "In","India", "Pakistan", "Pakistan", null,"Austria"}; |
| break; |
| } |
| |
| frame1.appendColumn(b); |
| frame1.appendColumn(s1); |
| frame1.appendColumn(s2); |
| frame1.appendColumn(l); |
| } |
| |
| private static FrameBlock tureOutput(double[][] data) { |
| FrameBlock frame1 = new FrameBlock(schema); |
| boolean[] b = new boolean[rows]; |
| String[] s1 = {"TU-Graz", "TU-Graz", "TU-Graz", "IIT", "IIT", "IIT","IIT", "SIBA", "SIBA", "SIBA", "TU-Wien"}; |
| String[] s2 = {"Austria", "Austria", "Austria", "India", "India", "India","India", "Pakistan", "Pakistan", "Pakistan", "Austria"}; |
| long[] l = new long[rows]; |
| for (int i = 0; i < rows; i++) { |
| data[i][1] = (b[i] = (Boolean) UtilFunctions.doubleToObject(Types.ValueType.BOOLEAN, data[i][1], false)) ? 1 : 0; |
| l[i] = (Long) UtilFunctions.doubleToObject(Types.ValueType.INT64, data[i][2], false); |
| } |
| frame1.appendColumn(b); |
| frame1.appendColumn(s1); |
| frame1.appendColumn(s2); |
| frame1.appendColumn(l); |
| return frame1; |
| } |
| |
| private static void verifyFrameData(FrameBlock frame1, FrameBlock frame2, Types.ValueType[] schema) { |
| for (int i = 0; i < frame1.getNumRows(); i++) |
| for (int j = 0; j < frame1.getNumColumns(); j++) { |
| Object val1 = UtilFunctions.stringToObject(schema[j], UtilFunctions.objectToString(frame1.get(i, j))); |
| Object val2 = UtilFunctions.stringToObject(schema[j], UtilFunctions.objectToString(frame2.get(i, j))); |
| if (TestUtils.compareToR(schema[j], val1, val2, epsilon) != 0) |
| Assert.fail("The DML data for cell (" + i + "," + j + ") is " + val1 + ", not same as the expected value " + val2); |
| } |
| } |
| } |