| # ------------------------------------------------------------- |
| # |
| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| # |
| # ------------------------------------------------------------- |
| |
| import unittest |
| |
| import numpy as np |
| from systemds.context import SystemDSContext |
| from systemds.matrix import Matrix |
| from systemds.operator.algorithm import multiLogReg, multiLogRegPredict |
| |
| |
| class TestMultiLogReg(unittest.TestCase): |
| |
| sds: SystemDSContext = None |
| |
| @classmethod |
| def setUpClass(cls): |
| cls.sds = SystemDSContext() |
| |
| @classmethod |
| def tearDownClass(cls): |
| cls.sds.close() |
| |
| def test_simple(self): |
| """ |
| Test simple, if the log reg splits a dataset where everything over 1 is label 2 and under 1 is 1. |
| With manual classification. |
| """ |
| [X, labels, Y] = self.gen_data() |
| |
| # Call algorithm |
| bias = multiLogReg(Matrix(self.sds,X),Matrix(self.sds,Y)).compute() |
| |
| # Calculate result. |
| res = np.reshape(np.dot(X, bias[:len(X[0])]) + bias[len(X[0])], (250)) |
| f2 = lambda x: (x < 0) + 1 |
| accuracy = np.sum(labels == f2(res)) / 250 * 100 |
| |
| self.assertTrue(accuracy > 98) |
| |
| def test_using_predict(self): |
| """ |
| Test the algorithm using the predict function. |
| With builtin classification |
| """ |
| [X, labels, Y] = self.gen_data() |
| # Call algorithm |
| bias = multiLogReg(Matrix(self.sds,X),Matrix(self.sds,Y)).compute() |
| |
| [m, y_pred, acc] = multiLogRegPredict(Matrix(self.sds,X),Matrix(self.sds,bias), Matrix(self.sds,Y)).compute() |
| |
| self.assertTrue(acc > 98) |
| |
| |
| def gen_data(self): |
| np.random.seed(13241) |
| # Generate data |
| mu, sigma = 1, 0.1 |
| X = np.reshape(np.random.normal(mu, sigma, 500), (2,250)) |
| # All over 1 is true |
| f = lambda x: (x[0] > 1) + 1 |
| labels = f(X) |
| # Y labels as double |
| Y = np.array(labels, dtype=np.double) |
| # Transpose X to fit input format. |
| X = X.transpose() |
| return X, labels, Y |
| |
| if __name__ == "__main__": |
| unittest.main(exit=False) |