| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| |
| import mxnet as mx |
| from mxnet import nd |
| |
| from benchmark.opperf.utils.benchmark_utils import run_performance_test |
| from benchmark.opperf.utils.benchmark_utils import run_op_benchmarks |
| from benchmark.opperf.utils.op_registry_utils import get_all_optimizer_operators |
| from benchmark.opperf.utils.common_utils import merge_map_list |
| from benchmark.opperf.rules.default_params import MX_OP_MODULE |
| |
| """Performance benchmark tests for MXNet Neural Network Optimizer Update Operators. |
| |
| 1. Stochastic Gradient Descent (SGD) |
| 1.1 mp_sgd_update |
| 1.2 sgd_mom_update |
| 1.3 signsgd_update |
| 1.4 mp_sgd_mom_update |
| 1.5 sgd_update |
| 2. signum_update |
| 3. rmspropalex_update |
| 4. ftml_update |
| 5. rmsprop_update |
| 6. ftrl_update |
| 7. adam_update |
| 8. preloaded_multi_* |
| 8.1 preloaded_multi_sgd_mom_update |
| 8.2 preloaded_multi_sgd_update |
| 8.3 preloaded_multi_mp_sgd_update |
| 8.4 preloaded_multi_mp_sgd_mom_update |
| 9. lamb_* |
| 9.1 lamb_update_phase1 |
| 9.2 lamb_update_phase2 |
| 10. multi_* |
| 10.1 multi_sgd_update |
| 10.2 multi_sgd_mom_update |
| 10.3 multi_mp_sgd_update |
| 10.4 multi_mp_sgd_mom_update |
| """ |
| |
| |
| def run_optimizer_operators_benchmarks(ctx=mx.cpu(), dtype='float32', profiler='native', int64_tensor='off', warmup=25, runs=100): |
| """Runs benchmarks with the given context, precision (dtype), and input data size (int64_tensor) for all the neural network |
| optimizer update operators in MXNet. |
| |
| Parameters |
| ---------- |
| ctx: mx.ctx |
| Context to run benchmarks |
| dtype: str, default 'float32' |
| Precision to use for benchmarks |
| profiler: str, default 'native' |
| Type of Profiler to use (native/python) |
| int64_tensor: str, default 'off' |
| Input tensor size to use for tests (if on, dimensions >= 2**32) |
| warmup: int, default 25 |
| Number of times to run for warmup |
| runs: int, default 100 |
| Number of runs to capture benchmark results |
| |
| Returns |
| ------- |
| Dictionary of results. Key -> Name of the operator, Value -> Benchmark results. |
| |
| """ |
| standard_shape = (5, 5) |
| int64_tensor_shape = (2**16, 2**16) |
| |
| if int64_tensor == 'on': |
| arg_shape = int64_tensor_shape |
| else: |
| arg_shape = standard_shape |
| |
| # Run independent tests for ops that need specific input data |
| multi_mp_sgd_mom_res = run_performance_test([getattr(MX_OP_MODULE, "multi_mp_sgd_mom_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape), "args2": nd.random_normal(shape=arg_shape), |
| "args3": nd.random_normal(shape=arg_shape), "lrs": 0.1, "wds": 0.2, |
| "out": nd.random_normal(shape=arg_shape)}],run_backward=False) |
| |
| multi_sgd_mom_res = run_performance_test([getattr(MX_OP_MODULE, "multi_sgd_mom_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape),"args2": nd.random_normal(shape=arg_shape), |
| "lrs": 0.1, "wds": 0.2, "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| multi_sgd_res = run_performance_test([getattr(MX_OP_MODULE, "multi_sgd_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape), "lrs": 0.1, "wds": 0.2, |
| "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| multi_mp_sgd_res = run_performance_test([getattr(MX_OP_MODULE, "multi_mp_sgd_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape),"args2": nd.random_normal(shape=arg_shape), |
| "lrs": 0.1, "wds": 0.2, "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| preloaded_multi_mp_sgd_res = run_performance_test( |
| [getattr(MX_OP_MODULE, "preloaded_multi_mp_sgd_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape), "args2": nd.random_normal(shape=arg_shape), |
| "args3": nd.random_normal(shape=(1)), "args4": nd.random_normal(shape=(1)), |
| "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| preloaded_multi_sgd_mom_res = run_performance_test( |
| [getattr(MX_OP_MODULE, "preloaded_multi_sgd_mom_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), |
| "args1": nd.random_normal(shape=arg_shape), "args2": nd.random_normal(shape=arg_shape), |
| "args3": nd.random_normal(shape=(1)), "args4": nd.random_normal(shape=(1)), |
| "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| preloaded_multi_sgd_res = run_performance_test( |
| [getattr(MX_OP_MODULE, "preloaded_multi_sgd_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), "args1": nd.random_normal(shape=arg_shape), |
| "args4": nd.random_normal(shape=(1)), "args5": nd.random_normal(shape=(1)), |
| "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| preloaded_multi_mp_sgd_mom_res = run_performance_test( |
| [getattr(MX_OP_MODULE, "preloaded_multi_mp_sgd_mom_update")], |
| inputs=[{"args0": nd.random_normal(shape=arg_shape), "args1": nd.random_normal(shape=arg_shape), |
| "args2": nd.random_normal(shape=arg_shape), "args3": nd.random_normal(shape=arg_shape), |
| "args4": nd.random_normal(shape=(1)), "args5": nd.random_normal(shape=(1)), |
| "out": nd.random_normal(shape=arg_shape)}], run_backward=False) |
| |
| # Fetch remaining optimizer operators |
| mx_optimizer_ops = get_all_optimizer_operators() |
| |
| # Run benchmarks |
| mx_optimizer_op_results = run_op_benchmarks(mx_optimizer_ops, dtype, ctx, profiler, int64_tensor, warmup, runs) |
| return merge_map_list(multi_sgd_mom_res + multi_sgd_mom_res + multi_sgd_res + multi_mp_sgd_res + preloaded_multi_mp_sgd_res +\ |
| preloaded_multi_sgd_mom_res + preloaded_multi_mp_sgd_res + preloaded_multi_mp_sgd_mom_res +\ |
| multi_mp_sgd_mom_res + preloaded_multi_sgd_res + [mx_optimizer_op_results]) |