| /* |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, |
| * software distributed under the License is distributed on an |
| * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| * KIND, either express or implied. See the License for the |
| * specific language governing permissions and limitations |
| * under the License. |
| */ |
| |
| package org.apache.sysds.test.functions.jmlc; |
| |
| import java.io.IOException; |
| import java.util.ArrayList; |
| import java.util.HashMap; |
| |
| import org.junit.Test; |
| import org.apache.sysds.api.jmlc.Connection; |
| import org.apache.sysds.api.jmlc.PreparedScript; |
| import org.apache.sysds.api.jmlc.ResultVariables; |
| import org.apache.sysds.common.Types.FileFormat; |
| import org.apache.sysds.conf.CompilerConfig.ConfigType; |
| import org.apache.sysds.runtime.controlprogram.parfor.stat.Timing; |
| import org.apache.sysds.runtime.matrix.data.MatrixBlock; |
| import org.apache.sysds.runtime.matrix.data.MatrixValue.CellIndex; |
| import org.apache.sysds.runtime.util.DataConverter; |
| import org.apache.sysds.test.AutomatedTestBase; |
| import org.apache.sysds.test.TestConfiguration; |
| import org.apache.sysds.test.TestUtils; |
| |
| public class MulticlassSVMScoreTest extends AutomatedTestBase |
| { |
| private final static String TEST_NAME = "m-svm-score"; |
| private final static String TEST_DIR = "functions/jmlc/"; |
| private final static String MODEL_FILE = "sentiment_model.mtx"; |
| private final static double eps = 1e-10; |
| private final static String TEST_CLASS_DIR = TEST_DIR + MulticlassSVMScoreTest.class.getSimpleName() + "/"; |
| |
| private final static int rows = 107; |
| private final static int cols = 46; //fixed |
| |
| private final static int nRuns = 3; |
| |
| private final static double sparsity1 = 0.7; |
| private final static double sparsity2 = 0.1; |
| |
| @Override |
| public void setUp() { |
| addTestConfiguration(TEST_NAME, new TestConfiguration(TEST_CLASS_DIR, TEST_NAME, new String[] { "predicted_y" }) ); |
| } |
| |
| @Test |
| public void testJMLCMulticlassScoreDense() throws IOException { |
| runJMLCMulticlassTest(false, false); |
| } |
| |
| @Test |
| public void testJMLCMulticlassScoreSparse() throws IOException { |
| runJMLCMulticlassTest(true, false); |
| } |
| |
| @Test |
| public void testJMLCMulticlassScoreDenseFlags() throws IOException { |
| runJMLCMulticlassTest(false, true); |
| } |
| |
| @Test |
| public void testJMLCMulticlassScoreSparseFlags() throws IOException { |
| runJMLCMulticlassTest(true, true); |
| } |
| |
| private void runJMLCMulticlassTest( boolean sparse, boolean flags ) |
| throws IOException |
| { |
| TestConfiguration config = getTestConfiguration(TEST_NAME); |
| loadTestConfiguration(config); |
| |
| //generate inputs |
| ArrayList<double[][]> Xset = generateInputs(nRuns, rows, cols, sparse?sparsity2:sparsity1, 7); |
| |
| //run DML via JMLC |
| ArrayList<double[][]> Yset = execDMLScriptviaJMLC( Xset, flags ); |
| |
| //write out R input and model once |
| MatrixBlock mb = DataConverter.readMatrixFromHDFS(SCRIPT_DIR + TEST_DIR + MODEL_FILE, |
| FileFormat.TEXT, rows, cols, 1000, 1000); |
| writeInputMatrix("X", Xset.get(0), true); |
| writeInputMatrix("W", DataConverter.convertToDoubleMatrix(mb), true); |
| |
| //run R test once |
| String HOME = SCRIPT_DIR + TEST_DIR; |
| fullRScriptName = HOME + TEST_NAME + ".R"; |
| rCmd = getRCmd(inputDir(), expectedDir()); |
| runRScript(true); |
| |
| //read and convert R output |
| HashMap<CellIndex, Double> rfile = readRMatrixFromFS("predicted_y"); |
| double[][] expected = TestUtils.convertHashMapToDoubleArray(rfile, rows, 1); |
| |
| //for each input data set compare results |
| for( int i=0; i<nRuns; i++ ) |
| TestUtils.compareMatrices(expected, Yset.get(i), rows, 1, eps); |
| } |
| |
| private static ArrayList<double[][]> execDMLScriptviaJMLC(ArrayList<double[][]> X, boolean flags) |
| throws IOException |
| { |
| Timing time = new Timing(true); |
| ArrayList<double[][]> ret = new ArrayList<>(); |
| |
| try( Connection conn = !flags ? new Connection(): |
| new Connection(ConfigType.PARALLEL_CP_MATRIX_OPERATIONS, |
| ConfigType.PARALLEL_LOCAL_OR_REMOTE_PARFOR, |
| ConfigType.ALLOW_DYN_RECOMPILATION) ) |
| { |
| //read and precompile script |
| String script = conn.readScript(SCRIPT_DIR + TEST_DIR + TEST_NAME + ".dml"); |
| PreparedScript pstmt = conn.prepareScript(script, new String[]{"X","W"}, new String[]{"predicted_y"}); |
| |
| //read model |
| String modelData = conn.readScript(SCRIPT_DIR + TEST_DIR + MODEL_FILE ); |
| double[][] W = conn.convertToDoubleMatrix(modelData, rows, cols); |
| |
| //execute script multiple times |
| for( int i=0; i<nRuns; i++ ) |
| { |
| //bind input parameters |
| pstmt.setMatrix("W", W); |
| pstmt.setMatrix("X", X.get(i)); |
| |
| //execute script |
| ResultVariables rs = pstmt.executeScript(); |
| |
| //get output parameter |
| double[][] Y = rs.getMatrix("predicted_y"); |
| ret.add(Y); //keep result for comparison |
| } |
| } |
| catch(Exception ex) { |
| throw new IOException(ex); |
| } |
| |
| System.out.println("JMLC scoring w/ "+nRuns+" runs in "+time.stop()+"ms."); |
| |
| return ret; |
| } |
| |
| private ArrayList<double[][]> generateInputs( int num, int rows, int cols, double sparsity, int seed ) { |
| ArrayList<double[][]> ret = new ArrayList<>(); |
| for( int i=0; i<num; i++ ) |
| ret.add(getRandomMatrix(rows, cols, -1, 1, sparsity, seed)); |
| return ret; |
| } |
| } |