# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
import os
import tempfile
import mxnet as mx
from mxnet import gluon
from mxnet.gluon import nn
from mxnet.base import py_str
from mxnet.test_utils import assert_almost_equal
from mxnet.ndarray.ndarray import _STORAGE_TYPE_STR_TO_ID
from common import (setup_module, with_seed, assertRaises, teardown,
assert_raises_cudnn_not_satisfied)
import numpy as np
from numpy.testing import assert_array_equal
from nose.tools import raises, assert_raises
from copy import deepcopy
import warnings
import json
import unittest
import random
@with_seed()
def test_parameter():
p = gluon.Parameter('weight', shape=(10, 10))
p.initialize(init='xavier', ctx=[mx.cpu(0), mx.cpu(1)])
assert len(p.list_data()) == 2
assert len(p.list_grad()) == 2
assert p.data(mx.cpu(1)).context == mx.cpu(1)
assert p.data(mx.cpu(0)).shape == (10, 10)
assert p.var().name == 'weight'
assert p.grad(mx.cpu(0)).stype == 'default'
assert p.data(mx.cpu(0)).stype == 'default'
p.reset_ctx(ctx=[mx.cpu(1), mx.cpu(2)])
assert p.list_ctx() == [mx.cpu(1), mx.cpu(2)]
@with_seed()
@raises(AssertionError)
def test_invalid_parameter_stype():
p = gluon.Parameter('weight', shape=(10, 10), stype='invalid')
@with_seed()
@raises(AssertionError)
def test_invalid_parameter_grad_stype():
p = gluon.Parameter('weight', shape=(10, 10), grad_stype='invalid')
@with_seed()
def test_sparse_parameter():
p = gluon.Parameter('weight', shape=(10, 10), stype='row_sparse', grad_stype='row_sparse')
p.initialize(init='xavier', ctx=[mx.cpu(0), mx.cpu(1)])
row_id = mx.nd.arange(0, 10, ctx=mx.cpu(1))
assert len(p.list_grad()) == 2
# getting row_sparse data without trainer throws an exception
assertRaises(RuntimeError, p.list_row_sparse_data, row_id)
trainer = mx.gluon.Trainer([p], 'sgd')
assert len(p.list_row_sparse_data(row_id)) == 2
weight = p.row_sparse_data(row_id)
assert weight.context == mx.cpu(1)
assert weight.shape == (10, 10)
assert weight.stype == 'row_sparse'
assert p.var().name == 'weight'
assert p.var().attr('__storage_type__') == str(_STORAGE_TYPE_STR_TO_ID['row_sparse'])
assert p.grad(mx.cpu(0)).stype == 'row_sparse'
p.reset_ctx(ctx=[mx.cpu(1), mx.cpu(2)])
assert p.list_ctx() == [mx.cpu(1), mx.cpu(2)]
@with_seed()
def test_parameter_invalid_access():
# cannot call data on row_sparse parameters
p0 = gluon.Parameter('weight', shape=(10, 10), stype='row_sparse', grad_stype='row_sparse')
p0.initialize(init='xavier', ctx=[mx.cpu(0), mx.cpu(1)])
assertRaises(RuntimeError, p0.data)
assertRaises(RuntimeError, p0.list_data)
row_id = mx.nd.arange(0, 10)
# cannot call row_sparse_data on dense parameters
p1 = gluon.Parameter('weight', shape=(10, 10))
p1.initialize(init='xavier', ctx=[mx.cpu(0), mx.cpu(1)])
assertRaises(RuntimeError, p1.row_sparse_data, row_id.copyto(mx.cpu(0)))
assertRaises(RuntimeError, p1.list_row_sparse_data, row_id)
@with_seed()
def test_parameter_dict():
ctx = mx.cpu(1)
params0 = gluon.ParameterDict('net_')
params0.get('w0', shape=(10, 10))
params0.get('w1', shape=(10, 10), stype='row_sparse')
all_row_ids = mx.nd.arange(0, 10, ctx=ctx)
# check param names
assert list(params0.keys()) == ['net_w0', 'net_w1']
params0.initialize(ctx=ctx)
trainer0 = mx.gluon.Trainer(params0, 'sgd')
prev_w0 = params0.get('w0').data(ctx)
prev_w1 = params0.get('w1').row_sparse_data(all_row_ids)
# save params
params0.save('test_parameter_dict.params')
# load params
params1 = gluon.ParameterDict('net_')
params1.get('w0', shape=(10, 10))
params1.get('w1', shape=(10, 10), stype='row_sparse')
params1.load('test_parameter_dict.params', ctx)
trainer1 = mx.gluon.Trainer(params1, 'sgd')
# compare the values before and after save/load
cur_w0 = params1.get('w0').data(ctx)
cur_w1 = params1.get('w1').row_sparse_data(all_row_ids)
mx.test_utils.assert_almost_equal(prev_w0.asnumpy(), cur_w0.asnumpy())
mx.test_utils.assert_almost_equal(prev_w1.asnumpy(), cur_w1.asnumpy())
# create a new param dict with dense params, and load from the checkpoint
# of sparse & dense params
params2 = gluon.ParameterDict('net_')
params2.get('w0', shape=(10, 10))
params2.get('w1', shape=(10, 10))
params2.load('test_parameter_dict.params', ctx)
# compare the values before and after save/load
cur_w0 = params2.get('w0').data(ctx)
cur_w1 = params2.get('w1').data(ctx)
mx.test_utils.assert_almost_equal(prev_w0.asnumpy(), cur_w0.asnumpy())
mx.test_utils.assert_almost_equal(prev_w1.asnumpy(), cur_w1.asnumpy())
# test reset_ctx
params3 = gluon.ParameterDict('net_')
params3.get('w0', shape=(10, 10))
params3.get('w1', shape=(10, 10))
params3.initialize(ctx=ctx)
list_contexts = [mx.cpu(42), mx.cpu(24)]
params3.reset_ctx(list_contexts)
for p in params3.values():
assert set(p.list_ctx()) == set(list_contexts)
# and test list_ctx
assert set(params3.list_ctx()) == set(list_contexts)
# test the dtype casting functionality
params0 = gluon.ParameterDict('')
params0.get('w0', shape=(10, 10), dtype='float32')
params0.get('w1', shape=(10, 10), dtype='int8')
params0.initialize(mx.init.One(), ctx=ctx)
params0.save('test_parameter_dict.params')
params1 = gluon.ParameterDict('')
params1.get('w0', shape=(10, 10), dtype='float16')
params1.get('w1', shape=(10, 10), dtype='float64')
params1.load('test_parameter_dict.params', cast_dtype=True, dtype_source='current')
assert params1['w0'].data().dtype == np.float16
assert params1['w1'].data().dtype == np.float64
params1.load('test_parameter_dict.params', cast_dtype=True, dtype_source='saved')
assert params1['w0'].data().dtype == np.float32
assert params1['w1'].data().dtype == np.int8
@with_seed()
def test_parameter_row_sparse_data():
ctx0 = mx.cpu(1)
ctx1 = mx.cpu(2)
dim0 = 4
x = gluon.Parameter('x', shape=(dim0, 2), stype='row_sparse')
x.initialize(init='xavier', ctx=[ctx0, ctx1])
trainer = gluon.Trainer([x], 'sgd')
x_param = x._data[0].copy()
assert x_param.stype == 'row_sparse'
row_id_0 = mx.nd.array([0,1], ctx=ctx0)
retained_0 = x.row_sparse_data(row_id_0)
retained_target_0 = mx.nd.sparse.retain(x_param, row_id_0.as_in_context(ctx0))
mx.test_utils.assert_almost_equal(retained_0.asnumpy(), retained_target_0.asnumpy())
assert retained_0.context == ctx0
row_id_1 = mx.nd.arange(0, dim0, ctx=ctx1)
retained_1 = x.row_sparse_data(row_id_1)
retained_target_1 = x_param
mx.test_utils.assert_almost_equal(retained_1.asnumpy(), retained_target_1.asnumpy())
assert retained_1.context == ctx1
row_id_2 = mx.nd.array([0,1,2])
retained_2 = x.list_row_sparse_data(row_id_2)
retained_target_2 = mx.nd.sparse.retain(x_param, row_id_2.as_in_context(ctx0))
mx.test_utils.assert_almost_equal(retained_2[0].asnumpy(), retained_target_2.asnumpy())
@with_seed()
def test_constant():
class Test(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Test, self).__init__(**kwargs)
self.value = np.asarray([[1,2], [3,4]])
self.const = self.params.get_constant('const', self.value)
def hybrid_forward(self, F, x, const):
return x + const
test = Test()
test.initialize()
trainer = gluon.Trainer(test.collect_params(), 'sgd',
{'learning_rate': 1.0, 'momentum': 0.5})
with mx.autograd.record():
x = mx.nd.ones((2,2))
x.attach_grad()
y = test(x)
y.backward()
trainer.step(1)
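# get_constant creates a parameter with grad_req='null', so the trainer step above must
# leave it unchanged, and the gradient simply flows through to x (d(x + const)/dx == 1);
# the two assertions below check exactly that.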
assert (test.const.data().asnumpy() == test.value).all()
assert (x.grad.asnumpy() == 1).all()
@with_seed()
def test_parameter_sharing():
class Net(gluon.Block):
def __init__(self, in_units=0, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.dense0 = nn.Dense(5, in_units=in_units)
self.dense1 = nn.Dense(5, in_units=in_units)
def forward(self, x):
return self.dense1(self.dense0(x))
net1 = Net(prefix='net1_', in_units=5)
net2 = Net(prefix='net2_', params=net1.collect_params())
net1.collect_params().initialize()
net2(mx.nd.zeros((3, 5)))
net1.save_parameters('net1.params')
net3 = Net(prefix='net3_')
net3.load_parameters('net1.params', mx.cpu())
net4 = Net(prefix='net4_')
net5 = Net(prefix='net5_', in_units=5, params=net4.collect_params())
net4.collect_params().initialize()
net5(mx.nd.zeros((3, 5)))
net4.save_parameters('net4.params')
net6 = Net(prefix='net6_')
net6.load_parameters('net4.params', mx.cpu())
@with_seed()
def test_parameter_str():
class Net(gluon.Block):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.dense0 = nn.Dense(10, in_units=5, use_bias=False)
net = Net(prefix='net1_')
lines = str(net.collect_params()).splitlines()
assert lines[0] == 'net1_ ('
assert 'net1_dense0_weight' in lines[1]
assert '(10, 5)' in lines[1]
assert 'float32' in lines[1]
assert lines[2] == ')'
@with_seed()
def test_collect_parameters():
net = nn.HybridSequential(prefix="test_")
with net.name_scope():
net.add(nn.Conv2D(10, 3))
net.add(nn.Dense(10, activation='relu'))
assert set(net.collect_params().keys()) == \
set(['test_conv0_weight', 'test_conv0_bias','test_dense0_weight','test_dense0_bias'])
assert set(net.collect_params('.*weight').keys()) == \
set(['test_conv0_weight', 'test_dense0_weight'])
assert set(net.collect_params('test_conv0_bias|test_dense0_bias').keys()) == \
set(['test_conv0_bias', 'test_dense0_bias'])
@with_seed()
def test_basic():
model = nn.Sequential()
model.add(nn.Dense(128, activation='tanh', in_units=10, flatten=False))
model.add(nn.Dropout(0.5))
model.add(nn.Dense(64, activation='tanh', in_units=256),
nn.Dense(32, in_units=64))
model.add(nn.Activation('relu'))
# symbol
x = mx.sym.var('data')
y = model(x)
assert len(y.list_arguments()) == 7
# ndarray
model.collect_params().initialize(mx.init.Xavier(magnitude=2.24))
x = model(mx.nd.zeros((32, 2, 10)))
assert x.shape == (32, 32)
x.wait_to_read()
model.collect_params().setattr('grad_req', 'null')
assert list(model.collect_params().values())[0]._grad is None
model.collect_params().setattr('grad_req', 'write')
assert list(model.collect_params().values())[0]._grad is not None
@with_seed()
def test_dense():
model = nn.Dense(128, activation='tanh', in_units=10, flatten=False, prefix='test_')
inputs = mx.sym.Variable('data')
outputs = model(inputs)
assert set(model.collect_params().keys()) == set(['test_weight', 'test_bias'])
assert outputs.list_outputs() == ['test_tanh_fwd_output']
args, outs, auxs = outputs.infer_shape(data=(2, 3, 10))
assert outs == [(2, 3, 128)]
model = nn.Dense(128, activation='relu', in_units=30, flatten=True, prefix='test2_')
inputs = mx.sym.Variable('data')
outputs = model(inputs)
assert set(model.collect_params().keys()) == set(['test2_weight', 'test2_bias'])
assert outputs.list_outputs() == ['test2_relu_fwd_output']
args, outs, auxs = outputs.infer_shape(data=(17, 2, 5, 3))
assert outs == [(17, 128)]
@with_seed()
def test_symbol_block():
model = nn.HybridSequential()
model.add(nn.Dense(128, activation='tanh'))
model.add(nn.Dropout(0.5))
model.add(nn.Dense(64, activation='tanh'),
nn.Dense(32, in_units=64))
model.add(nn.Activation('relu'))
model.initialize()
inputs = mx.sym.var('data')
outputs = model(inputs).get_internals()
smodel = gluon.SymbolBlock(outputs, inputs, params=model.collect_params())
assert len(smodel(mx.nd.zeros((16, 10)))) == 14
out = smodel(mx.sym.var('in'))
assert len(out) == len(outputs.list_outputs())
class Net(nn.HybridBlock):
def __init__(self, model):
super(Net, self).__init__()
self.model = model
def hybrid_forward(self, F, x):
out = self.model(x)
return F.add_n(*[i.sum() for i in out])
net = Net(smodel)
net.hybridize()
assert isinstance(net(mx.nd.zeros((16, 10))), mx.nd.NDArray)
inputs = mx.sym.var('data')
outputs = model(inputs)
smodel = gluon.SymbolBlock(outputs, inputs, params=model.collect_params())
net = Net(smodel)
net.hybridize()
assert isinstance(net(mx.nd.zeros((16, 10))), mx.nd.NDArray)
# Test case to verify initializing a SymbolBlock from a model whose params
# have a dtype other than fp32.
# 1. Load a resnet model, cast it to fp64 and export
tmp = tempfile.mkdtemp()
tmpfile = os.path.join(tmp, 'resnet34_fp64')
ctx = mx.cpu(0)
net_fp32 = mx.gluon.model_zoo.vision.resnet34_v2(pretrained=True, ctx=ctx, root=tmp)
net_fp32.cast('float64')
net_fp32.hybridize()
data = mx.nd.zeros((1,3,224,224), dtype='float64', ctx=ctx)
net_fp32.forward(data)
net_fp32.export(tmpfile, 0)
# 2. Load the saved model and verify that all the params are loaded correctly;
# choose one of the params and verify its dtype is fp64.
sym_file = tmpfile + '-symbol.json'
params_file = tmpfile + '-0000.params'
sm = mx.sym.load(sym_file)
inputs = mx.sym.var('data', dtype='float64')
net_fp64 = mx.gluon.SymbolBlock(sm, inputs)
net_fp64.collect_params().load(params_file, ctx=ctx)
# Get a conv layer's weight parameter name. The conv layer's weight param is
# expected to have been cast to fp64.
for param_name in net_fp64.params.keys():
if 'conv' in param_name and 'weight' in param_name:
break
assert np.dtype(net_fp64.params[param_name].dtype) == np.dtype(np.float64)
# 3. Verify the same functionality with the imports API
net_fp_64 = mx.gluon.SymbolBlock.imports(sym_file, 'data', params_file, ctx=ctx)
# Get a conv layer's weight parameter name. The conv layer's weight param is
# expected to have been cast to fp64.
for param_name in net_fp_64.params.keys():
if 'conv' in param_name and 'weight' in param_name:
break
assert np.dtype(net_fp_64.params[param_name].dtype) == np.dtype(np.float64)
# Cast the symbol block to FP32 and try to forward FP32 data.
# This verifies the SymbolBlock.cast() functionality.
net_fp64.cast('float32')
fp32_data = mx.nd.zeros((1,3,224,224), dtype='float32', ctx=ctx)
prediction = net_fp64.forward(fp32_data)
assert np.dtype(prediction.dtype) == np.dtype(np.float32)
@with_seed()
@raises(AssertionError)
def test_sparse_symbol_block():
data = mx.sym.var('data')
weight = mx.sym.var('weight', stype='row_sparse')
bias = mx.sym.var('bias')
out = mx.sym.broadcast_add(mx.sym.dot(data, weight), bias)
# an exception is expected when creating a SymbolBlock w/ a sparse param
net = gluon.SymbolBlock(out, data)
@with_seed()
@raises(RuntimeError)
def test_sparse_hybrid_block():
params = gluon.ParameterDict('net_')
params.get('weight', shape=(5,5), stype='row_sparse', dtype='float32')
params.get('bias', shape=(5), dtype='float32')
net = gluon.nn.Dense(5, params=params)
net.initialize()
x = mx.nd.ones((2,5))
# an exception is expected when forwarding a HybridBlock w/ sparse param
y = net(x)
@with_seed()
def test_hybrid_block_none_args():
class Foo(gluon.HybridBlock):
def hybrid_forward(self, F, a, b):
if a is None and b is not None:
return b
elif b is None and a is not None:
return a
elif a is not None and b is not None:
return a + b
else:
raise NotImplementedError
class FooDefault(gluon.HybridBlock):
def hybrid_forward(self, F, a, b=None):
if a is None and b is not None:
return b
elif b is None and a is not None:
return a
elif a is not None and b is not None:
return a + b
else:
raise NotImplementedError
class FooNested(gluon.HybridBlock):
def __init__(self, prefix=None, params=None):
super(FooNested, self).__init__(prefix=prefix, params=params)
self.f1 = Foo(prefix='foo1')
self.f2 = Foo(prefix='foo2')
self.f3 = Foo(prefix='foo3')
def hybrid_forward(self, F, a, b):
data = self.f1(a, b)
data = self.f2(a, data)
data = self.f3(data, b)
return data
for arg_inputs in [(None, mx.nd.ones((10,))),
(mx.nd.ones((10,)), mx.nd.ones((10,))),
(mx.nd.ones((10,)), None)]:
foo1 = FooNested(prefix='foo_nested_hybridized')
foo1.hybridize()
foo2 = FooNested(prefix='foo_nested_nohybrid')
for _ in range(2):  # loop twice so the second pass exercises the cached op
out1 = foo1(*arg_inputs)
out2 = foo2(*arg_inputs)
if isinstance(out1, tuple):
for lhs, rhs in zip(out1, out2):
assert_almost_equal(lhs.asnumpy(), rhs.asnumpy())
else:
assert_almost_equal(out1.asnumpy(), out2.asnumpy())
for do_hybridize in [True, False]:
foo = FooNested()
if do_hybridize:
foo.hybridize()
assert_raises(ValueError, foo, None, None)
# Make sure the ValueError is correctly raised
foo = FooNested()
foo.hybridize()
foo(None, mx.nd.ones((10,))) # Pass for the first time to initialize the cached op
assert_raises(ValueError, lambda: foo(mx.nd.ones((10,)), mx.nd.ones((10,))))
foo = FooNested()
assert_raises(ValueError, lambda: foo(mx.nd.ones((10,)), mx.sym.var('a')))
foo = FooNested()
assert_raises(ValueError, lambda: foo(mx.sym.var('a'), mx.nd.ones((10,))))
# Test the case of the default values
foo1 = FooDefault()
foo1.hybridize()
foo2 = FooDefault()
out1 = foo1(mx.nd.ones((10,)))
out2 = foo2(mx.nd.ones((10,)))
out3 = foo1(mx.nd.ones((10,)), None)
out4 = foo2(mx.nd.ones((10,)), None)
assert_almost_equal(out1.asnumpy(), out2.asnumpy())
assert_almost_equal(out1.asnumpy(), out3.asnumpy())
assert_almost_equal(out1.asnumpy(), out4.asnumpy())
foo1 = FooDefault()
foo1.hybridize()
out1 = foo1(mx.nd.ones((10,)), None)
out2 = foo1(mx.nd.ones((10,)))
assert_almost_equal(out1.asnumpy(), out2.asnumpy())
assert_raises(ValueError, lambda: foo1(mx.nd.ones((10,)), mx.nd.ones((10,))))
@with_seed()
def check_layer_forward(layer, dshape):
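# Shared helper: run the layer imperatively, record the output and the input gradient,
# then hybridize the layer and repeat, asserting that both runs agree.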
print("checking layer {}\nshape: {}.".format(layer, dshape))
layer.collect_params().initialize()
x = mx.nd.ones(shape=dshape)
x.attach_grad()
with mx.autograd.record():
out = layer(x)
out.backward()
np_out = out.asnumpy()
np_dx = x.grad.asnumpy()
layer.hybridize()
x = mx.nd.ones(shape=dshape)
x.attach_grad()
with mx.autograd.record():
out = layer(x)
out.backward()
mx.test_utils.assert_almost_equal(np_out, out.asnumpy(), rtol=1e-5, atol=1e-6)
mx.test_utils.assert_almost_equal(np_dx, x.grad.asnumpy(), rtol=1e-5, atol=1e-6)
@with_seed()
def test_conv():
layers1d = [
nn.Conv1D(16, 3, in_channels=4),
nn.Conv1D(16, 3, groups=2, in_channels=4),
nn.Conv1D(16, 3, strides=3, groups=2, in_channels=4),
]
for layer in layers1d:
check_layer_forward(layer, (1, 4, 10))
layers2d = [
nn.Conv2D(16, (3, 4), in_channels=4),
nn.Conv2D(16, (5, 4), in_channels=4),
nn.Conv2D(16, (3, 4), groups=2, in_channels=4),
nn.Conv2D(16, (3, 4), strides=4, in_channels=4),
nn.Conv2D(16, (3, 4), dilation=4, in_channels=4),
nn.Conv2D(16, (3, 4), padding=4, in_channels=4),
]
for layer in layers2d:
check_layer_forward(layer, (1, 4, 20, 20))
layers3d = [
nn.Conv3D(16, (1, 8, 4), in_channels=4, activation='relu'),
nn.Conv3D(16, (5, 4, 3), in_channels=4),
nn.Conv3D(16, (3, 3, 3), groups=2, in_channels=4),
nn.Conv3D(16, 4, strides=4, in_channels=4),
nn.Conv3D(16, (3, 3, 3), padding=4, in_channels=4),
]
for layer in layers3d:
check_layer_forward(layer, (1, 4, 10, 10, 10))
layer = nn.Conv2D(16, (3, 3), layout='NHWC', in_channels=4)
# check_layer_forward(layer, (1, 10, 10, 4))
layer = nn.Conv3D(16, (3, 3, 3), layout='NDHWC', in_channels=4)
# check_layer_forward(layer, (1, 10, 10, 10, 4))
@with_seed()
def test_deconv():
# layers1d = [
# nn.Conv1DTranspose(16, 3, in_channels=4),
# nn.Conv1DTranspose(16, 3, groups=2, in_channels=4),
# nn.Conv1DTranspose(16, 3, strides=3, groups=2, in_channels=4),
# ]
# for layer in layers1d:
# check_layer_forward(layer, (1, 4, 10))
layers2d = [
nn.Conv2DTranspose(16, (3, 4), in_channels=4),
nn.Conv2DTranspose(16, (5, 4), in_channels=4),
nn.Conv2DTranspose(16, (3, 4), groups=2, in_channels=4),
nn.Conv2DTranspose(16, (3, 4), strides=4, in_channels=4),
nn.Conv2DTranspose(16, (3, 4), dilation=4, in_channels=4),
# nn.Conv2DTranspose(16, (3, 4), padding=4, in_channels=4),
nn.Conv2DTranspose(16, (3, 4), strides=4, output_padding=3, in_channels=4),
]
for layer in layers2d:
check_layer_forward(layer, (1, 4, 20, 20))
# layers3d = [
# nn.Conv3DTranspose(16, (1, 8, 4), in_channels=4),
# nn.Conv3DTranspose(16, (5, 4, 3), in_channels=4),
# nn.Conv3DTranspose(16, (3, 3, 3), groups=2, in_channels=4),
# nn.Conv3DTranspose(16, 4, strides=4, in_channels=4),
# nn.Conv3DTranspose(16, (3, 3, 3), padding=4, in_channels=4),
# ]
# for layer in layers3d:
# check_layer_forward(layer, (1, 4, 10, 10, 10))
#
#
# layer = nn.Conv2DTranspose(16, (3, 3), layout='NHWC', in_channels=4)
# # check_layer_forward(layer, (1, 10, 10, 4))
#
# layer = nn.Conv3DTranspose(16, (3, 3, 3), layout='NDHWC', in_channels=4)
# # check_layer_forward(layer, (1, 10, 10, 10, 4))
@with_seed()
def test_pool():
# transpose shape to bring feature dimension 'c' from 2nd position to last
def transpose(shape):
return (shape[0],) + shape[2:] + (shape[1],)
for layout in ['NCW', 'NWC']:
shape1d = (1, 2, 10)
if layout == 'NWC':
shape1d = transpose(shape1d)
layers1d = [
nn.MaxPool1D(layout=layout),
nn.MaxPool1D(3, layout=layout),
nn.MaxPool1D(3, 2, layout=layout),
nn.AvgPool1D(layout=layout),
nn.AvgPool1D(count_include_pad=False, layout=layout),
nn.GlobalAvgPool1D(layout=layout),
]
for layer in layers1d:
check_layer_forward(layer, shape1d)
for layout in ['NCHW', 'NHWC']:
shape2d = (1, 2, 10, 10)
if layout == 'NHWC':
shape2d = transpose(shape2d)
layers2d = [
nn.MaxPool2D(layout=layout),
nn.MaxPool2D((3, 3), layout=layout),
nn.MaxPool2D(3, 2, layout=layout),
nn.AvgPool2D(layout=layout),
nn.AvgPool2D(count_include_pad=False, layout=layout),
nn.GlobalAvgPool2D(layout=layout),
]
for layer in layers2d:
check_layer_forward(layer, shape2d)
for layout in ['NCDHW', 'NDHWC']:
shape3d = (1, 2, 10, 10, 10)
if layout == 'NDHWC':
shape3d = transpose(shape3d)
layers3d = [
nn.MaxPool3D(layout=layout),
nn.MaxPool3D((3, 3, 3), layout=layout),
nn.MaxPool3D(3, 2, layout=layout),
nn.AvgPool3D(layout=layout),
nn.AvgPool3D(count_include_pad=False, layout=layout),
nn.GlobalAvgPool3D(layout=layout),
]
for layer in layers3d:
check_layer_forward(layer, shape3d)
# test ceil_mode
for layout in ['NCHW', 'NHWC']:
xshape = (2, 2, 10, 10)
noceil_out_shape = (2, 2, 3, 3)
ceil_out_shape = (2, 2, 4, 4)
if layout == 'NHWC':
xshape = transpose(xshape)
noceil_out_shape = transpose(noceil_out_shape)
ceil_out_shape = transpose(ceil_out_shape)
x = mx.nd.zeros(xshape)
layer = nn.MaxPool2D(3, ceil_mode=False, layout=layout)
layer.collect_params().initialize()
assert (layer(x).shape==noceil_out_shape)
layer = nn.MaxPool2D(3, ceil_mode=True, layout=layout)
layer.collect_params().initialize()
assert (layer(x).shape==ceil_out_shape)
@with_seed()
def test_batchnorm():
layer = nn.BatchNorm(in_channels=10)
check_layer_forward(layer, (2, 10, 10, 10))
@with_seed()
def test_sync_batchnorm():
def _check_batchnorm_result(input, num_devices=1, cuda=False):
from mxnet.gluon.utils import split_and_load
def _find_bn(module):
if isinstance(module, (mx.gluon.nn.BatchNorm, mx.gluon.contrib.nn.SyncBatchNorm)):
return module
elif isinstance(module.module, (mx.gluon.nn.BatchNorm, mx.gluon.contrib.nn.SyncBatchNorm)):
return module.module
raise RuntimeError('BN not found')
def _syncParameters(bn1, bn2, ctx):
ctx = input.context
bn2.gamma.set_data(bn1.gamma.data(ctx))
bn2.beta.set_data(bn1.beta.data(ctx))
bn2.running_mean.set_data(bn1.running_mean.data(ctx))
bn2.running_var.set_data(bn1.running_var.data(ctx))
input1 = input.copy()
input2 = input.copy()
if cuda:
input1 = input.as_in_context(mx.gpu(0))
ctx_list = [mx.gpu(i) for i in range(num_devices)]
else:
ctx_list = [mx.cpu(0) for _ in range(num_devices)]
nch = input.shape[1] if input.ndim > 1 else 1
bn1 = mx.gluon.nn.BatchNorm(in_channels=nch)
bn2 = mx.gluon.contrib.nn.SyncBatchNorm(
in_channels=nch, num_devices=num_devices)
bn1.initialize(ctx=ctx_list[0])
bn2.initialize(ctx=ctx_list)
# using the same values for gamma and beta
#_syncParameters(_find_bn(bn1), _find_bn(bn2), ctx_list[0])
input1.attach_grad()
inputs2 = split_and_load(input2, ctx_list, batch_axis=0)
for xi in inputs2:
xi.attach_grad()
with mx.autograd.record():
output1 = bn1(input1)
output2 = [bn2(xi) for xi in inputs2]
loss1 = (output1 ** 2).sum()
loss2 = [(output ** 2).sum() for output in output2]
mx.autograd.backward(loss1)
mx.autograd.backward(loss2)
output2 = mx.nd.concat(*[output.as_in_context(input.context)
for output in output2], dim=0)
# check bn1
momentum = 0.9
epsilon = 1e-5
axis = 1
data = input1
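# Reference computation: BatchNorm normalizes with the per-batch statistics,
# y = (x - mean) / sqrt(var + eps), and updates the running statistics as an
# exponential moving average: running = running * momentum + batch_stat * (1 - momentum).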
running_mean = mx.nd.zeros(nch, ctx=data.context)
running_var = mx.nd.ones(nch, ctx=data.context)
data_mean = data.mean(
axis=axis, exclude=True, keepdims=True)
data_var = (data - data_mean).square().mean(axis=axis,
exclude=True, keepdims=True)
target_output = (data - data_mean) / (data_var + epsilon).sqrt()
# squeeze data_mean and data_var
data_mean_flat = data_mean.squeeze()
data_var_flat = data_var.squeeze()
running_mean = running_mean * momentum + \
data_mean_flat * (1 - momentum)
running_var = running_var * momentum + \
data_var_flat * (1 - momentum)
atol = 1e-2
rtol = 1e-2
assert_almost_equal(output1.asnumpy(), target_output.asnumpy(),
atol=atol, rtol=rtol)
assert_almost_equal(_find_bn(bn1).running_mean.data(ctx_list[0]).asnumpy(),
running_mean.asnumpy(),
atol=atol, rtol=rtol)
assert_almost_equal(_find_bn(bn1).running_var.data(ctx_list[0]).asnumpy(),
running_var.asnumpy(),
atol=atol, rtol=rtol)
# assert forwarding
assert_almost_equal(input1.asnumpy(), input2.asnumpy(),
atol=atol, rtol=rtol)
assert_almost_equal(output1.asnumpy(),
output2.asnumpy(), atol=atol, rtol=rtol)
assert_almost_equal(_find_bn(bn1).running_mean.data(ctx_list[0]).asnumpy(),
_find_bn(bn2).running_mean.data(ctx_list[0]).asnumpy(),
atol=atol, rtol=rtol)
assert_almost_equal(_find_bn(bn1).running_var.data(ctx_list[0]).asnumpy(),
_find_bn(bn2).running_var.data(ctx_list[0]).asnumpy(),
atol=atol, rtol=rtol)
input2grad = mx.nd.concat(
*[output.grad.as_in_context(input.context) for output in inputs2], dim=0)
assert_almost_equal(input1.grad.asnumpy(),
input2grad.asnumpy(), atol=atol, rtol=rtol)
cfgs = [(1, False)]
num_gpus = mx.context.num_gpus()
for i in range(1, num_gpus + 1):
cfgs.append((i, True))
for ndev, cuda in cfgs:
# check with unsync version
for shape in [(24, 2), (24, 3, 4), (24, 4, 4, 4), (24, 5, 6, 4, 4)]:
print(str((ndev, cuda, shape)))
for i in range(10):
_check_batchnorm_result(mx.nd.random.uniform(shape=shape,
ctx=mx.cpu(0)),
num_devices=ndev, cuda=cuda)
@with_seed()
def test_instancenorm():
layer = nn.InstanceNorm(in_channels=10)
check_layer_forward(layer, (2, 10, 10, 10))
@with_seed()
def test_layernorm():
layer = nn.LayerNorm(in_channels=10)
check_layer_forward(layer, (2, 10, 10, 10))
@with_seed()
def test_groupnorm():
layer = nn.GroupNorm()
check_layer_forward(layer, (2, 10, 10, 10))
layer = nn.GroupNorm(num_groups=2)
check_layer_forward(layer, (2, 10, 10, 10))
layer = nn.GroupNorm(num_groups=5)
check_layer_forward(layer, (2, 10, 10, 10))
@with_seed()
def test_reflectionpad():
layer = nn.ReflectionPad2D(3)
check_layer_forward(layer, (2, 3, 24, 24))
@with_seed()
def test_reshape():
x = mx.nd.ones((2, 4, 10, 10))
layer = nn.Conv2D(10, 2, in_channels=4)
layer.collect_params().initialize()
with mx.autograd.record():
x = layer(x)
x = x.reshape((-1,))
x = x + 10
x.backward()
@with_seed()
def test_slice():
x = mx.nd.ones((5, 4, 10, 10))
layer = nn.Conv2D(10, 2, in_channels=4)
layer.collect_params().initialize()
with mx.autograd.record():
x = layer(x)
x = x[1:3]
x = x + 10
x.backward()
@with_seed()
def test_at():
x = mx.nd.ones((5, 4, 10, 10))
layer = nn.Conv2D(10, 2, in_channels=4)
layer.collect_params().initialize()
with mx.autograd.record():
x = layer(x)
x = x[1]
x = x + 10
x.backward()
@with_seed()
def test_deferred_init():
x = mx.nd.ones((5, 4, 10, 10))
layer = nn.Conv2D(10, 2)
layer.collect_params().initialize()
layer(x)
def check_split_data(x, num_slice, batch_axis, **kwargs):
res = gluon.utils.split_data(x, num_slice, batch_axis, **kwargs)
assert len(res) == num_slice
mx.test_utils.assert_almost_equal(mx.nd.concat(*res, dim=batch_axis).asnumpy(),
x.asnumpy())
@with_seed()
def test_split_data():
x = mx.nd.random.uniform(shape=(128, 33, 64))
check_split_data(x, 8, 0)
check_split_data(x, 3, 1)
check_split_data(x, 4, 1, even_split=False)
check_split_data(x, 15, 1, even_split=False)
try:
check_split_data(x, 4, 1)
except ValueError:
return
assert False, "Should have failed"
@with_seed()
def test_flatten():
flatten = nn.Flatten()
x = mx.nd.zeros((3,4,5,6))
assert flatten(x).shape == (3, 4*5*6)
x = mx.nd.zeros((3,6))
assert flatten(x).shape == (3, 6)
x = mx.nd.zeros((3,))
assert flatten(x).shape == (3, 1)
@with_seed()
def test_block_attr_hidden():
b = gluon.Block()
# regular attributes can change types
b.a = None
b.a = 1
@raises(TypeError)
@with_seed()
def test_block_attr_block():
b = gluon.Block()
# an attribute that already holds a Block can't be re-assigned to a different type
b.b = gluon.Block()
b.b = (2,)
@raises(TypeError)
@with_seed()
def test_block_attr_param():
b = gluon.Block()
# an attribute that already holds a Parameter can't be re-assigned to a different type
b.b = gluon.Parameter()
b.b = (2,)
@with_seed()
def test_block_attr_regular():
b = gluon.Block()
# set block attribute also sets _children
b.c = gluon.Block()
c2 = gluon.Block()
b.c = c2
assert b.c is c2 and list(b._children.values())[0] is c2
@with_seed()
def test_block_attr_list_of_block():
class Model1(gluon.Block):
def __init__(self, **kwargs):
super(Model1, self).__init__(**kwargs)
with self.name_scope():
self.layers = [nn.Dense(i * 10) for i in range(6)]
class Model2(gluon.Block):
def __init__(self, **kwargs):
super(Model2, self).__init__(**kwargs)
with self.name_scope():
self.layers = dict()
self.layers['a'] = [nn.Dense(10), nn.Dense(10)]
class Model3(gluon.Block):
def __init__(self, **kwargs):
super(Model3, self).__init__(**kwargs)
with self.name_scope():
self.layers = nn.Sequential()
self.layers.add(*[nn.Dense(i * 10) for i in range(6)])
class Model4(gluon.Block):
def __init__(self, **kwargs):
super(Model4, self).__init__(**kwargs)
with self.name_scope():
self.data = {'a': '4', 'b': 123}
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter('always')
model = Model1()
model.collect_params()
assert len(w) > 0
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter('always')
model = Model2()
model.collect_params()
assert len(w) > 0
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter('always')
model = Model3()
model.collect_params()
assert len(w) == 0
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter('always')
model = Model4()
model.collect_params()
assert len(w) == 0
def check_sequential(net):
dense1 = gluon.nn.Dense(10)
net.add(dense1)
dense2 = gluon.nn.Dense(10)
net.add(dense2)
dense3 = gluon.nn.Dense(10)
net.add(dense3)
assert net[1] is dense2
assert net[-1] is dense3
slc = net[1:3]
assert len(slc) == 2 and slc[0] is dense2 and slc[1] is dense3
assert isinstance(slc, type(net))
@with_seed()
def test_sequential():
check_sequential(gluon.nn.Sequential())
check_sequential(gluon.nn.HybridSequential())
@with_seed()
def test_sequential_warning():
with warnings.catch_warnings(record=True) as w:
# The following line permits the test to pass if run multiple times
warnings.simplefilter('always')
b = gluon.nn.Sequential()
b.add(gluon.nn.Dense(20))
b.hybridize()
assert len(w) == 1
@with_seed()
def test_global_norm_clip():
stypes = ['default', 'row_sparse']
def check_global_norm_clip(stype, check_isfinite):
x1 = mx.nd.ones((3,3)).tostype(stype)
x2 = mx.nd.ones((4,4)).tostype(stype)
norm = gluon.utils.clip_global_norm([x1, x2], 1.0, check_isfinite=check_isfinite)
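# global norm = sqrt(9 * 1^2 + 16 * 1^2) = 5.0, so with max_norm=1.0 every element
# is rescaled by 1/5, which the assertions below verify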
assert norm == 5.0
assert_almost_equal(x1.asnumpy(), np.ones((3,3))/5)
assert_almost_equal(x2.asnumpy(), np.ones((4,4))/5)
x3 = mx.nd.array([1.0, 2.0, float('nan')]).tostype(stype)
with warnings.catch_warnings(record=True) as w:
warnings.simplefilter("always")
gluon.utils.clip_global_norm([x1, x3], 2.0, check_isfinite=check_isfinite)
assert len(w) == check_isfinite
for stype in stypes:
for check_isfinite in [True, False]:
check_global_norm_clip(stype, check_isfinite)
@with_seed()
def test_embedding():
def check_embedding(sparse_grad):
layer = gluon.nn.Embedding(10, 100, sparse_grad=sparse_grad)
layer.initialize()
x = mx.nd.array([3,4,2,0,1])
with mx.autograd.record():
y = layer(x)
y.backward()
assert (layer.weight.grad().asnumpy()[:5] == 1).all()
assert (layer.weight.grad().asnumpy()[5:] == 0).all()
def check_embedding_large_input(sparse_grad):
embedding = mx.gluon.nn.Embedding(10, 1, sparse_grad=True)
embedding.initialize()
embedding.hybridize()
shape = (20481,)
with mx.autograd.record():
emb_in = embedding(mx.nd.ones(shape))
loss = emb_in.sum()
loss.backward()
assert embedding.weight.grad().data.sum().asscalar() == 20481
check_embedding(True)
check_embedding(False)
check_embedding_large_input(True)
check_embedding_large_input(False)
@with_seed()
def test_export():
ctx = mx.context.current_context()
model = gluon.model_zoo.vision.resnet18_v1(
prefix='resnet', ctx=ctx, pretrained=True)
model.hybridize()
data = mx.nd.random.normal(shape=(1, 3, 32, 32))
out = model(data)
model.export('gluon')
module = mx.mod.Module.load('gluon', 0, label_names=None, context=ctx)
module.bind(data_shapes=[('data', data.shape)])
module.forward(mx.io.DataBatch([data], None), is_train=False)
mod_out, = module.get_outputs()
assert_almost_equal(out.asnumpy(), mod_out.asnumpy())
model2 = gluon.model_zoo.vision.resnet18_v1(prefix='resnet', ctx=ctx)
model2.collect_params().load('gluon-0000.params', ctx)
out2 = model2(data)
assert_almost_equal(out.asnumpy(), out2.asnumpy())
@with_seed()
def test_import():
ctx = mx.context.current_context()
net1 = gluon.model_zoo.vision.resnet18_v1(
prefix='resnet', ctx=ctx, pretrained=True)
net1.hybridize()
data = mx.nd.random.normal(shape=(1, 3, 32, 32))
out1 = net1(data)
net1.export('net1', epoch=1)
net2 = gluon.SymbolBlock.imports(
'net1-symbol.json', ['data'], 'net1-0001.params', ctx)
out2 = net2(data)
lines = str(net2).splitlines()
assert_almost_equal(out1.asnumpy(), out2.asnumpy())
assert lines[0] == 'SymbolBlock('
assert lines[1]
assert lines[2] == ')'
@with_seed()
def test_hybrid_stale_cache():
net = mx.gluon.nn.HybridSequential()
with net.name_scope():
net.add(mx.gluon.nn.Dense(10, weight_initializer='zeros', bias_initializer='ones', flatten=False))
net.hybridize()
net.initialize()
net(mx.nd.ones((2,3,5)))
net.add(mx.gluon.nn.Flatten())
assert net(mx.nd.ones((2,3,5))).shape == (2, 30)
net = mx.gluon.nn.HybridSequential()
with net.name_scope():
net.fc1 = mx.gluon.nn.Dense(10, weight_initializer='zeros',
bias_initializer='ones', flatten=False)
net.fc2 = mx.gluon.nn.Dense(10, weight_initializer='zeros',
bias_initializer='ones', flatten=False)
net.hybridize()
net.initialize()
net(mx.nd.ones((2,3,5)))
net.fc2 = mx.gluon.nn.Dense(10, weight_initializer='zeros',
bias_initializer='ones', flatten=True)
net.initialize()
assert net(mx.nd.ones((2,3,5))).shape == (2, 10)
@with_seed()
def test_lambda():
net1 = mx.gluon.nn.HybridSequential()
net1.add(nn.Activation('tanh'),
nn.LeakyReLU(0.1))
net2 = mx.gluon.nn.HybridSequential()
op3 = lambda F, x, *args: F.LeakyReLU(x, *args, slope=0.1)
net2.add(nn.HybridLambda('tanh'),
nn.HybridLambda(op3))
op4 = lambda x: mx.nd.LeakyReLU(x, slope=0.1)
net3 = mx.gluon.nn.Sequential()
net3.add(nn.Lambda('tanh'),
nn.Lambda(op4))
input_data = mx.nd.random.uniform(shape=(2, 3, 5, 7))
out1, out2, out3 = net1(input_data), net2(input_data), net3(input_data)
assert_almost_equal(out1.asnumpy(), out2.asnumpy(), rtol=1e-3, atol=1e-3)
assert_almost_equal(out1.asnumpy(), out3.asnumpy(), rtol=1e-3, atol=1e-3)
@with_seed()
def test_fill_shape_deferred():
net = nn.HybridSequential()
with net.name_scope():
net.add(nn.Conv2D(64, kernel_size=2, padding=1),
nn.BatchNorm(),
nn.Dense(10))
net.hybridize()
net.initialize()
net(mx.nd.ones((2,3,5,7)))
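# The first forward pass resolves the deferred shapes: the conv weight infers
# in_channels=3, BatchNorm picks up the 64 conv channels, and the Dense weight infers
# in_units = 64 * 6 * 8 = 3072 (a 2x2 kernel with padding 1 on a 5x7 input gives 6x8).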
assert net[0].weight.shape[1] == 3, net[0].weight.shape[1]
assert net[1].gamma.shape[0] == 64, net[1].gamma.shape[0]
assert net[2].weight.shape[1] == 3072, net[2].weight.shape[1]
@with_seed()
def test_dtype():
net = mx.gluon.model_zoo.vision.resnet18_v1()
net.initialize()
net.cast('float64')
with mx.autograd.record():
y = net(mx.nd.ones((16, 3, 32, 32), dtype='float64'))
y.backward()
net = mx.gluon.model_zoo.vision.resnet18_v1()
net.initialize()
net.hybridize()
net(mx.nd.ones((16, 3, 32, 32), dtype='float32'))
net.cast('float64')
net(mx.nd.ones((16, 3, 32, 32), dtype='float64'))
mx.nd.waitall()
class Net(gluon.Block):
def __init__(self, in_dim, output_dim):
super(Net, self).__init__()
with self.name_scope():
self.embed = gluon.nn.Embedding(input_dim=in_dim, output_dim=output_dim,dtype=np.float64)
self.dense = gluon.nn.Dense(2, dtype=np.float64)
def forward(self, x):
e = self.embed(x)
assert(e.dtype == np.float64)
y = self.dense(e)
assert(y.dtype == np.float64)
return y
net = Net(5, 10)
net.initialize()
out = net(mx.nd.ones((3,), dtype=np.float64))
mx.nd.waitall()
@with_seed()
def test_fill_shape_load():
ctx = mx.context.current_context()
net1 = nn.HybridSequential()
with net1.name_scope():
net1.add(nn.Conv2D(64, kernel_size=2, padding=1),
nn.BatchNorm(),
nn.Dense(10))
net1.hybridize()
net1.initialize(ctx=ctx)
net1(mx.nd.ones((2,3,5,7), ctx))
net1.save_parameters('net_fill.params')
net2 = nn.HybridSequential()
with net2.name_scope():
net2.add(nn.Conv2D(64, kernel_size=2, padding=1),
nn.BatchNorm(),
nn.Dense(10))
net2.hybridize()
net2.initialize()
net2.load_parameters('net_fill.params', ctx)
assert net2[0].weight.shape[1] == 3, net2[0].weight.shape[1]
assert net2[1].gamma.shape[0] == 64, net2[1].gamma.shape[0]
assert net2[2].weight.shape[1] == 3072, net2[2].weight.shape[1]
@with_seed()
def test_inline():
net = mx.gluon.nn.HybridSequential()
with net.name_scope():
net.add(mx.gluon.nn.Dense(10))
net.add(mx.gluon.nn.Dense(10))
net.add(mx.gluon.nn.Dense(10))
net.initialize()
net.hybridize(inline_limit=3)
with mx.autograd.record():
y = net(mx.nd.zeros((1,10)))
len_1 = len(json.loads(mx.autograd.get_symbol(y).tojson())['nodes'])
y.backward()
net.hybridize(inline_limit=0)
with mx.autograd.record():
y = net(mx.nd.zeros((1,10)))
len_2 = len(json.loads(mx.autograd.get_symbol(y).tojson())['nodes'])
y.backward()
assert len_1 == len_2 + 2
@with_seed()
def test_activations():
point_to_validate = mx.nd.array([-0.1, 0.1] * 3)
swish = mx.gluon.nn.Swish()
def swish_test(x):
return x * mx.nd.sigmoid(x)
for test_point, ref_point in zip(swish_test(point_to_validate), swish(point_to_validate)):
assert test_point == ref_point
elu = mx.gluon.nn.ELU()
def elu_test(x):
def elu(x):
return mx.nd.expm1(x) if x <= 0.0 else x
return [elu(x_i) for x_i in x]
for test_point, ref_point in zip(elu_test(point_to_validate), elu(point_to_validate)):
assert_almost_equal(test_point.asnumpy(), ref_point.asnumpy())
selu = mx.gluon.nn.SELU()
def selu_test(x):
def selu(x):
scale, alpha = 1.0507009873554804934193349852946, 1.6732632423543772848170429916717
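# scale and alpha are the standard SELU constants from Klambauer et al.,
# "Self-Normalizing Neural Networks": selu(x) = scale * x for x >= 0,
# scale * alpha * (exp(x) - 1) otherwise.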
return scale * x if x >= 0 else scale * alpha * mx.nd.expm1(x)
return [selu(x_i) for x_i in x]
for test_point, ref_point in zip(selu_test(point_to_validate), selu(point_to_validate)):
assert test_point == ref_point
prelu = mx.gluon.nn.PReLU()
prelu.initialize()
x = point_to_validate.reshape((1, 3, 2))
assert_almost_equal(prelu(x).asnumpy(), mx.nd.where(x >= 0, x, 0.25 * x).asnumpy())
gelu = mx.gluon.nn.GELU()
def gelu_test(x):
CUBE_CONSTANT = 0.044715
ROOT_TWO_OVER_PI = 0.7978845608028654
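# Reference uses the tanh approximation of GELU, with ROOT_TWO_OVER_PI = sqrt(2 / pi):
# gelu(x) ~= 0.5 * x * (1 + tanh(sqrt(2 / pi) * (x + 0.044715 * x^3)))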
def g(x):
return ROOT_TWO_OVER_PI * (x + CUBE_CONSTANT * x * x * x)
def f(x):
return 1.0 + mx.nd.tanh(g(x))
def gelu(x):
return 0.5 * x * f(x)
return [gelu(x_i) for x_i in x]
for test_point, ref_point in zip(gelu_test(point_to_validate), gelu(point_to_validate)):
assert test_point == ref_point
@with_seed()
def test_dropout():
def get_slice(x, axis, idx):
ix = ()
for i in range(x.ndim):
if i == axis:
ix += (idx,)
else:
ix += (slice(None, None, None),)
return x[ix]
def check_dropout_axes(ratio, shape, axes):
compactshape = list(shape)
for axis in axes:
compactshape[axis] = 1
compactx = mx.random.uniform(shape=tuple(compactshape))
broadcastx = compactx.broadcast_to(shape)
dropouty = mx.gluon.nn.Dropout(rate=ratio, axes=axes)(broadcastx)
for axis in axes:
target = get_slice(dropouty, axis, 0).asnumpy()
for i in range(1, shape[axis]):
assert(get_slice(dropouty, axis, i).asnumpy() == target).all()
nshape = (10, 10, 10, 10)
with mx.autograd.train_mode():
check_dropout_axes(0.25, nshape, axes = (0,))
check_dropout_axes(0.25, nshape, axes = (1,))
check_dropout_axes(0.25, nshape, axes = (2,))
check_dropout_axes(0.25, nshape, axes = (3,))
check_dropout_axes(0.25, nshape, axes = (0, 1))
check_dropout_axes(0.25, nshape, axes = (0, 2))
check_dropout_axes(0.25, nshape, axes = (0, 3))
check_dropout_axes(0.25, nshape, axes = (1, 2))
check_dropout_axes(0.25, nshape, axes = (1, 3))
check_dropout_axes(0.25, nshape, axes = (2, 3))
check_dropout_axes(0.25, nshape, axes = (0, 1, 2))
check_dropout_axes(0.25, nshape, axes = (0, 2, 3))
check_dropout_axes(0.25, nshape, axes = (1, 2, 3))
@with_seed()
def test_req():
data = mx.nd.random.uniform(shape=(1,3,224,224))
label = mx.nd.random.uniform(shape=(1))
label[:] = 1
loss = gluon.loss.SoftmaxCrossEntropyLoss()
net = nn.HybridSequential()
net1 = nn.HybridSequential()
net1.add(nn.Dense(4))
net2 = nn.HybridSequential()
net2.add(nn.Dense(3))
net2.add(nn.Dense(2))
net.add(net1)
net.add(net2)
net.initialize()
net.hybridize()
for v in net.collect_params().values():
v.grad_req = 'add'
net.collect_params().zero_grad()
with mx.autograd.record():
pred = net(data)
l = loss(pred, label)
l.backward()
grad = net[0][0].weight.grad().mean().asnumpy()
# run twice to check req = add
pred = net(data)
l = loss(pred, label)
l.backward()
grad_double = net[0][0].weight.grad().mean().asnumpy()
assert_almost_equal(grad * 2, grad_double)
@with_seed()
def test_save_load():
net = mx.gluon.model_zoo.vision.get_resnet(1, 18, pretrained=True)
net.save_parameters('test_save_load.params')
net = mx.gluon.model_zoo.vision.get_resnet(1, 18)
net.output = mx.gluon.nn.Dense(1000)
net.load_parameters('test_save_load.params')
class Network(gluon.Block):
def __init__(self, **kwargs):
super(Network, self).__init__(**kwargs)
with self.name_scope():
self.encoders = gluon.nn.Sequential()
with self.encoders.name_scope():
for _ in range(2):
lstm = mx.gluon.rnn.LSTM(200, 1, bidirectional=True)
self.encoders.add(lstm)
def forward(self, x):
for i in range(2):
x = self.encoders[i](x)
return x
net = Network()
net.initialize(mx.init.Xavier(), ctx=mx.cpu())
net.hybridize()
x = np.random.rand(32, 10, 10)
x = mx.nd.array(x).as_in_context(mx.cpu())
net(x)
net.save_parameters('tmp.params')
net2 = Network()
net2.load_parameters('tmp.params')
@with_seed()
def test_symbol_block_save_load():
class Net(gluon.HybridBlock):
def __init__(self):
super(Net, self).__init__()
with self.name_scope():
backbone = gluon.model_zoo.vision.resnet18_v1()
data = mx.sym.var('data')
featnames = ['stage1_activation0', 'stage2_activation0', 'stage3_activation0']
out_names = ['_'.join([backbone.name, featname, 'output']) for featname in featnames]
internals = backbone(data).get_internals()
outs = [internals[out_name] for out_name in out_names]
self.backbone = gluon.SymbolBlock(outs, data, params=backbone.collect_params())
self.body = nn.Conv2D(3, 1)
def hybrid_forward(self, F, x):
x = self.body(x)
return self.backbone(x)
net1 = Net()
net1.initialize(mx.init.Normal())
net1.hybridize()
net1(mx.nd.random.normal(shape=(1, 3, 32, 32)))
net1.save_parameters('./test_symbol_block_save_load.params')
net2 = Net()
net2.load_parameters('./test_symbol_block_save_load.params', ctx=mx.cpu())
@with_seed()
def test_hybrid_multi_context():
net = mx.gluon.model_zoo.vision.get_resnet(1, 18)
net.initialize(ctx=[mx.cpu(0), mx.cpu(1)])
net.hybridize()
net(mx.nd.zeros((1, 3, 32, 32), ctx=mx.cpu(0))).asnumpy()
@with_seed()
def test_zero_grad():
def _test_grad_reset(ctx, dtype='float32', sparse=False, embeddingType=None):
data = mx.nd.random.uniform(shape=(3,3), dtype=dtype, ctx=ctx)
if embeddingType is None:
embeddingType = dtype
net = nn.Embedding(3, 4, sparse_grad=sparse, prefix='test_zero_grad_', dtype=embeddingType)
net.initialize(ctx=ctx)
with mx.autograd.record():
l = net(data)
l.backward()
net.collect_params().zero_grad()
grad = net.collect_params()['test_zero_grad_weight'].grad()
assert_almost_equal(grad.asnumpy(), grad.asnumpy() * 0)
def _test_multi_reset(nArrays, dtype, ctx):
# Construct the list of non-zero arrays with random shapes
arr = []
for _ in range(nArrays):
arrType = random.choice(dtype) if isinstance(dtype, list) else dtype
shape = ()
for _ in range(np.random.randint(1, 5)):
shape = shape + (np.random.randint(1, 10),)
arr.append(mx.nd.random.uniform(shape=shape, dtype=arrType, ctx=ctx))
# Reset all arrays
mx.nd.reset_arrays(*arr, num_arrays=len(arr))
# Check results
for i in range(nArrays):
grad = arr[i].asnumpy()
assert_almost_equal(grad, grad * 0)
# Setting context for current test
ctx = mx.context.current_context()
# Launching _test_multi_reset 10 times with different types & randomly chosen nArrays
testedTypes = ['float16', 'float32', 'float64']
for _ in range(10):
for type in [testedTypes] + testedTypes:
_test_multi_reset(np.random.randint(1, 50), type, ctx)
# Saving value of environment variable, if it was defined
envVarKey = 'MXNET_STORAGE_FALLBACK_LOG_VERBOSE'
envVarValue = os.environ[envVarKey] if envVarKey in os.environ else None
# Changing value of environment variable
os.environ[envVarKey] = '0'
for type in ['float16', 'float32', 'float64']:
for embType in ['float32', 'float64']:
for sparse in [True, False]:
_test_grad_reset(ctx, dtype=type, sparse=sparse, embeddingType=embType)
# Remove or restore the value of environment variable
if envVarValue is None:
del os.environ[envVarKey]
else:
os.environ[envVarKey] = envVarValue
def check_hybrid_static_memory(**kwargs):
x = mx.nd.random.uniform(shape=(2, 3, 32, 32))
x.attach_grad()
net1 = gluon.model_zoo.vision.get_resnet(
1, 18, pretrained=True, prefix='net_', ctx=mx.context.current_context())
net2 = gluon.model_zoo.vision.get_resnet(
1, 18, pretrained=True, prefix='net_', ctx=mx.context.current_context())
net2.hybridize(**kwargs)
net1(x)
net2(x)
def test(net, x):
with mx.autograd.record():
y = net(x) + net(x)
y.backward()
grads = {k: v.grad() for k, v in net.collect_params().items() if v.grad_req != 'null'}
return y, grads
y1, grads1 = test(net1, x)
y2, grads2 = test(net2, x)
assert_almost_equal(y1.asnumpy(), y2.asnumpy(), rtol=1e-3, atol=1e-5)
for key in grads1:
assert_almost_equal(grads1[key].asnumpy(), grads2[key].asnumpy(), rtol=1e-3, atol=1e-5)
@with_seed()
def test_hybrid_static_memory():
check_hybrid_static_memory()
check_hybrid_static_memory(static_alloc=True)
check_hybrid_static_memory(static_alloc=True, static_shape=True)
def check_hybrid_static_memory_switching(**kwargs):
net = gluon.model_zoo.vision.get_resnet(
1, 18, pretrained=True, ctx=mx.context.current_context())
net.hybridize(**kwargs)
x = mx.nd.random.uniform(shape=(4, 3, 32, 32))
net(x)
with mx.autograd.record():
y = net(x)
y.backward()
x = mx.nd.random.uniform(shape=(2, 3, 32, 32))
net(x)
with mx.autograd.record():
y = net(x)
y.backward()
mx.nd.waitall()
@with_seed()
def test_hybrid_static_memory_switching():
check_hybrid_static_memory_switching()
check_hybrid_static_memory_switching(static_alloc=True)
check_hybrid_static_memory_switching(static_alloc=True, static_shape=True)
@with_seed()
def test_hook():
global hook_call_count
hook_call_count = 0
global pre_hook_call_count
pre_hook_call_count = 0
def call_hook(block, x, y):
global hook_call_count
hook_call_count += 1
def call_pre_hook(block, x):
global pre_hook_call_count
pre_hook_call_count += 1
block = nn.Dense(10)
block.initialize()
handle = block.register_forward_hook(call_hook)
pre_handle = block.register_forward_pre_hook(call_pre_hook)
block(mx.nd.ones((3, 5)))
assert hook_call_count == 1
assert pre_hook_call_count == 1
handle.detach()
block(mx.nd.ones((3, 5)))
assert hook_call_count == 1
assert pre_hook_call_count == 2
pre_handle.detach()
block(mx.nd.ones((3, 5)))
assert hook_call_count == 1
assert pre_hook_call_count == 2
@with_seed()
def test_op_hook_output_names():
def check_name(block, expected_names, inputs=None, expected_opr_names=None, monitor_all=False):
opr_names = []
output_names = []
def mon_callback(node_name, opr_name, arr):
output_names.append(py_str(node_name))
opr_names.append(py_str(opr_name))
block.register_op_hook(mon_callback, monitor_all)
if not inputs:
block(mx.nd.ones((2, 3, 4)))
else:
block(inputs)
for output_name, expected_name in zip(output_names, expected_names):
print(output_name)
assert output_name == expected_name
if expected_opr_names:
for opr_name, expected_opr_name in zip(opr_names, expected_opr_names):
assert opr_name == expected_opr_name
# Test with Dense layer
model = mx.gluon.nn.HybridSequential(prefix="dense_")
with model.name_scope():
model.add(mx.gluon.nn.Dense(2))
model.initialize()
model.hybridize()
check_name(model, ["dense_dense0_fwd_output"])
# Test with Activation, FListInputNames not registered, input name will have _input appended
model = mx.gluon.nn.HybridSequential(prefix="relu_")
with model.name_scope():
model.add(mx.gluon.nn.Activation("relu"))
model.initialize()
model.hybridize()
check_name(model, ["relu_relu0_fwd_output"])
# Test with Pooling, monitor_all is set to True
model = mx.gluon.nn.HybridSequential("pool_")
with model.name_scope():
model.add(mx.gluon.nn.AvgPool1D())
model.initialize()
model.hybridize()
check_name(model, ['pool_pool0_fwd_data', 'pool_pool0_fwd_output'], expected_opr_names=["Pooling"],
monitor_all=True)
# stack two layers and test
model = mx.gluon.nn.HybridSequential("dense_")
with model.name_scope():
model.add(mx.gluon.nn.Dense(2))
model.add(mx.gluon.nn.Activation("relu"))
model.initialize()
model.hybridize()
check_name(model,
['dense_dense0_fwd_data', 'dense_dense0_fwd_weight',
'dense_dense0_fwd_bias', 'dense_dense0_fwd_output',
'dense_relu0_fwd_input0', 'dense_relu0_fwd_output'], monitor_all=True)
# check with different hybridize modes
model.hybridize(static_alloc=True)
check_name(model,
['dense_dense0_fwd_data', 'dense_dense0_fwd_weight',
'dense_dense0_fwd_bias', 'dense_dense0_fwd_output',
'dense_relu0_fwd_input0', 'dense_relu0_fwd_output'], monitor_all=True)
@with_seed()
def test_apply():
global called_blocks
called_blocks = []
def record_name(block):
global called_blocks
called_blocks.append(block.name)
block = nn.HybridSequential(prefix='test_')
with block.name_scope():
block.add(nn.Dense(10))
block.add(nn.Dropout(0.5))
block.apply(record_name)
assert called_blocks == ['test_dense0', 'test_dropout0', 'test']
@with_seed()
@assert_raises_cudnn_not_satisfied(min_version='5.1.10')
def test_summary():
net = gluon.model_zoo.vision.resnet50_v1()
net.initialize()
net.summary(mx.nd.ones((32, 3, 224, 224)))
net2 = nn.Sequential()
with net2.name_scope():
net2.add(nn.Embedding(40, 30))
net2.add(gluon.rnn.LSTM(30))
net2.add(nn.Dense(40, flatten=False, params=net2[0].params))
net2.initialize()
net2.summary(mx.nd.ones((80, 32)))
net3 = gluon.rnn.LSTM(30)
net3.initialize()
begin_state = net3.begin_state(32)
net3.summary(mx.nd.ones((80, 32, 5)), begin_state)
net.hybridize()
assert_raises(AssertionError, net.summary, mx.nd.ones((32, 3, 224, 224)))
@with_seed()
def test_legacy_save_params():
net = gluon.nn.HybridSequential(prefix='')
with net.name_scope():
net.add(gluon.nn.Conv2D(10, (3, 3)))
net.add(gluon.nn.Dense(50))
net.initialize()
net(mx.nd.ones((1,1,50,50)))
a = net(mx.sym.var('data'))
a.save('test.json')
net.save_params('test.params')
model = gluon.nn.SymbolBlock(outputs=mx.sym.load_json(open('test.json', 'r').read()),
inputs=mx.sym.var('data'))
model.load_params('test.params', ctx=mx.cpu())
@with_seed()
def test_sparse_hybrid_block_grad():
class Embedding(mx.gluon.HybridBlock):
def __init__(self, num_tokens, embedding_size):
super(Embedding, self).__init__()
self.num_tokens = num_tokens
with self.name_scope():
self.embedding = mx.gluon.nn.Embedding(
num_tokens, embedding_size, sparse_grad=True)
def hybrid_forward(self, F, words):
emb = self.embedding(words)
return emb + F.ones_like(emb)
embedding = Embedding(20, 3)
embedding.initialize()
embedding.hybridize()
with mx.autograd.record():
emb0 = embedding(mx.nd.arange(10)).sum()
emb1 = embedding(mx.nd.arange(10)).sum()
loss = emb0 + emb1
loss.backward()
grad = embedding.embedding.weight.grad().asnumpy()
assert (grad[:10] == 2).all()
assert (grad[10:] == 0).all()
@with_seed()
def test_sparse_hybrid_block():
class Linear(mx.gluon.HybridBlock):
def __init__(self, units):
super(Linear, self).__init__()
with self.name_scope():
self.w = self.params.get('w', shape=(units, units))
def hybrid_forward(self, F, x, w):
return F.dot(x, w)
class SparseBlock(mx.gluon.HybridBlock):
def __init__(self, units):
super(SparseBlock, self).__init__()
with self.name_scope():
self.net = Linear(units)
def hybrid_forward(self, F, x):
return self.net(x) * x
block = SparseBlock(2)
block.initialize()
block.hybridize()
x = mx.nd.ones((2,2)).tostype('csr')
with mx.autograd.record():
z = block(x) + block(x)
z.backward()
assert (block.net.w.grad().asnumpy() == 4).all()
def test_hybrid_static_memory_recording():
net = gluon.model_zoo.vision.get_resnet(
1, 18, pretrained=True, ctx=mx.context.current_context())
net.hybridize(static_alloc=True)
x = mx.nd.random.uniform(shape=(1, 3, 32, 32))
with mx.autograd.record(True):
net(x)
net(x)
def test_share_inputs_outputs():
class TestIOBackward(gluon.HybridBlock):
def __init__(self, prefix=None, params=None):
super(TestIOBackward, self).__init__(prefix=prefix, params=params)
def hybrid_forward(self, F, in1, in2):
return in1 + in2
class TestIOForward(gluon.HybridBlock):
def __init__(self, prefix=None, params=None):
super(TestIOForward, self).__init__(prefix=prefix, params=params)
def hybrid_forward(self, F, in1):
return in1
d1 = mx.nd.arange(10)
d2 = mx.nd.arange(10)
params=[{'inline_limit':0},
{'inline_limit':0, 'static_alloc':True},
{'inline_limit':0, 'static_alloc':True, 'static_shape':True}]
# Test the case that inputs and outputs of a forward graph share NDArrays.
for param in params:
t = TestIOForward()
t.hybridize(**param)
for i in range(5):
d1.attach_grad()
out_grad = mx.nd.random.uniform(shape=(10))
res = t(d1)
assert_almost_equal(res.asnumpy(), d1.asnumpy())
param = deepcopy(params[2])
param['param_indices'] = (1)
param['data_indices'] = (0)
params.append(param)
# Test the case that inputs and outputs of a backward graph share NDArrays.
for param in params:
t = TestIOBackward()
t.hybridize(**param)
for i in range(5):
d1.attach_grad()
d2.attach_grad()
out_grad = mx.nd.random.uniform(shape=(10))
with mx.autograd.record():
res = t(d1, d2)
res.backward(out_grad=out_grad)
assert_almost_equal(out_grad.asnumpy(), d1.grad.asnumpy())
assert_almost_equal(out_grad.asnumpy(), d2.grad.asnumpy())
def test_grad_graph_change():
class Model(mx.gluon.HybridBlock):
def hybrid_forward(self, F, array, index):
row = array.take(index)
return row, index
array = mx.nd.arange(3)
index = mx.nd.array([2])
array.attach_grad()
model = Model()
model.hybridize(inline_limit=0)
with mx.autograd.record(train_mode=True):
row, _ = model(array, index)
row.backward()
def check_layer_forward_withinput(net, x):
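# Shared helper: forward/backward the given input through the net imperatively and then
# hybridized, and assert that the outputs and the input gradients match.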
x_hybrid = x.copy()
x.attach_grad()
x_hybrid.attach_grad()
net.collect_params().initialize()
with mx.autograd.record():
out1 = net(x)
out1.backward()
net.hybridize()
with mx.autograd.record():
out2 = net(x_hybrid)
out2.backward()
mx.test_utils.assert_almost_equal(x.grad.asnumpy(), x_hybrid.grad.asnumpy(), rtol=1e-5, atol=1e-6)
mx.test_utils.assert_almost_equal(out1.asnumpy(), out2.asnumpy(), rtol=1e-5, atol=1e-6)
@with_seed()
def test_conv2d_16c():
chn_list = [16, 256]
kernel_list = [1, 3]
kernel_list.append(224)
batch_size = 4
class Net(gluon.HybridBlock):
def __init__(self,
chn_num,
kernel,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = gluon.nn.Conv2D(chn_num, (kernel, kernel))
def hybrid_forward(self, F, x):
out = self.conv0(x)
return out
x = mx.nd.random.uniform(-1.0, 1.0, shape=(batch_size, 3, 224, 224))
for i in range(len(chn_list)):
for j in range(len(kernel_list)):
net = Net(chn_list[i], kernel_list[j])
check_layer_forward_withinput(net, x)
@with_seed()
def test_group_conv2d_16c():
grp_list = [16]
input_size_list = np.random.randint(low=3, high=65, size=10).tolist()
kernel_list = [1, 3]
batch_size = 4
class Net(gluon.HybridBlock):
def __init__(self,
chn_num,
kernel,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = gluon.nn.Conv2D(chn_num, (1, 1))
self.conv1 = gluon.nn.Conv2D(chn_num, (kernel, kernel), groups=chn_num)
def hybrid_forward(self, F, x):
y = self.conv0(x)
out = self.conv1(y)
return out
for i in range(len(input_size_list)):
x = mx.nd.random.uniform(-1.0, 1.0, shape=(batch_size, 3, input_size_list[i], input_size_list[i]))
for j in range(len(grp_list)):
for k in range(len(kernel_list)):
net = Net(grp_list[j], kernel_list[k])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_deconv2d_16c():
in_chn_list = [1024, 512, 256, 128, 64, 32, 16]
out_chn_list = [512, 256, 128, 64, 32, 16, 3]
kernel_list = [1, 3, 5, 7]
in_shape = [4, 8, 16, 32, 64, 224]
batch_size = 4
class Net(gluon.HybridBlock):
def __init__(self, chn_num, kernel, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.deconv0 = gluon.nn.Conv2DTranspose(chn_num, (kernel, kernel))
def hybrid_forward(self, F, x):
out = self.deconv0(x)
return out
for i in range(len(in_shape)):
x = mx.nd.random.uniform(-1.0, 1.0, shape=(batch_size, in_chn_list[i], in_shape[i], in_shape[i]))
for j in range(len(kernel_list)):
net = Net(out_chn_list[i], kernel_list[j])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_batchnorm_16c():
chn_list = [16, 1024]
shape = np.random.randint(low=1, high=300, size=10)
shape_list = []
for i in range(len(shape)):
shape_list.append((shape[i], shape[i]))
batch_size = 4
class Net(gluon.HybridBlock):
def __init__(self,
chn_num,
kernel,
axis,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = gluon.nn.Conv2D(chn_num, (kernel, kernel))
self.bn0 = gluon.nn.BatchNorm(axis=axis)
def hybrid_forward(self, F, x):
conv = self.conv0(x)
out = self.bn0(conv)
return out
for i in range(len(chn_list)):
for j in range(len(shape_list)):
shape = (batch_size, ) + (3,) + shape_list[j]
x = mx.nd.random.uniform(-1.0, 1.0, shape=shape)
net = Net(chn_list[i], 1, 1)
check_layer_forward_withinput(net, x)
@with_seed()
def test_concat():
chn_list = [16, 64]
shapes = [1, 3, 5]
input_num = np.random.randint(low=2, high=11)
shape_list = []
for i in range(len(shapes)):
shape_list.append((shapes[i], shapes[i]))
batch_size = 4
class Net(gluon.HybridBlock):
def __init__(self,
check_dim,
input_num,
chn_num,
kernel,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
from mxnet.gluon.contrib.nn import HybridConcurrent
self.concat = HybridConcurrent(axis=check_dim)
for i in range(input_num):
self.concat.add(gluon.nn.Conv2D(chn_num, (kernel, kernel)))
def hybrid_forward(self, F, x):
return self.concat(x)
for s in range(len(shape_list)):
        shape = (batch_size,) + (3,) + shape_list[s]
x = mx.nd.random.uniform(-1.0, 1.0, shape=shape)
for i in range(len(chn_list)):
for axis in range(4):
net = Net(axis, input_num, chn_list[i], 1)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_conv():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(64, (3, 3))
def hybrid_forward(self, F, x):
x_reshape = x.reshape((0, 0, 128, 32))
out = self.conv0(x_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 3, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_conv_reshape_conv():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(64, (3, 3))
self.conv1 = nn.Conv2D(128, (3, 3))
def hybrid_forward(self, F, x):
x_reshape = x.reshape((0, 0, 128, 32))
y = self.conv0(x_reshape)
"spatial shape of y is (62, 62)"
y_reshape = y.reshape((0, 0, 124, 31))
out = self.conv1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 3, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_conv():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(16, (3, 3))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=(0, 2, 0, 0), end=(4, 5, 32, 32))
out = self.conv0(x_slice)
return out
x = mx.nd.random.uniform(shape=(8, 6, 32, 32))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_conv_slice_conv():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(32, (3, 3))
self.conv1 = nn.Conv2D(16, (1, 1))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=(0, 0, 0, 0), end=(4, 16, 16, 16))
y = self.conv0(x_slice)
"shape of y is (4, 32, 14, 14)"
y_slice = y.slice(begin=(0, 0, 0, 0), end=(4, 16, 3, 3))
out = self.conv1(y_slice)
return out
x = mx.nd.random.uniform(shape=(4, 32, 32, 32))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_conv_reshape_conv():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(64, (3, 3))
self.conv1 = nn.Conv2D(128, (3, 3))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=(0, 0, 1, 1), end=(4, 16, 33, 33))
y = self.conv0(x_slice)
"shape of y is (4, 64, 30, 30)"
y_reshape = y.reshape((0, 0, 60, 15))
out = self.conv1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 32, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_conv_slice_conv():
"""
    Test gluon Conv2D computation with ndarray reshape and slice.
"""
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(16, (3, 3))
self.conv1 = nn.Conv2D(32, (3, 3))
def hybrid_forward(self, F, x):
x_reshape = x.reshape((0, 0, 64, 16))
y = self.conv0(x_reshape)
"shape of y is (4, 16, 62, 14)"
y_slice = y.slice(begin=(0, 0, 0, 0), end=(2, 16, 14, 14))
out = self.conv1(y_slice)
return out
x = mx.nd.random.uniform(shape=(4, 3, 32, 32))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_dense():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = np.random.randint(1, 17)
self.dense0 = nn.Dense(channel0)
def hybrid_forward(self, F, x):
x_reshape = x.reshape((8, 64, 128, -1))
out = self.dense0(x_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 32, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_dense():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = np.random.randint(1, 17)
self.dense0 = nn.Dense(channel0)
self.slice = slice
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=tuple(self.slice[0]),
end=tuple(self.slice[1]))
out = self.dense0(x_slice)
return out
x = mx.nd.random.uniform(shape=(16, 32, 64, 64))
slice = [[0, 16, 0, 0], [4, 32, 32, 32]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_dense_slice_dense():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = 32
channel1 = np.random.randint(1, 17)
self.dense0 = nn.Dense(channel0)
self.dense1 = nn.Dense(channel1)
self.slice = slice
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=tuple(self.slice[0]), end=tuple(self.slice[1]))
y = self.dense0(x_slice)
y_slice = y.slice(begin=(1, 0), end=(3, 10))
out = self.dense1(y_slice)
return out
x = mx.nd.random.uniform(shape=(16, 32, 64, 64))
slice = [[0, 16, 0, 0], [4, 32, 32, 32]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_dense_reshape_dense():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = np.random.randint(1, 17)
channel1 = np.random.randint(1, 33)
self.dense0 = nn.Dense(channel0)
self.dense1 = nn.Dense(channel1)
def hybrid_forward(self, F, x):
x_reshape = x.reshape((4, 16, 128, 32))
y = self.dense0(x_reshape)
y_reshape = y.reshape((1, -1))
out = self.dense1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 16, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_dense_reshape_dense():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = np.random.randint(1, 17)
channel1 = np.random.randint(1, 17)
self.dense0 = nn.Dense(channel0)
self.dense1 = nn.Dense(channel1)
self.slice = slice
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=tuple(self.slice[0]), end=tuple(self.slice[1]))
y = self.dense0(x_slice)
y_reshape = y.reshape((1, -1))
out = self.dense1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(16, 32, 64, 64))
slice = [[0, 16, 0, 0], [4, 32, 32, 32]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_dense_slice_dense():
class Net(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
channel0 = 64
channel1 = np.random.randint(1, 17)
self.dense0 = nn.Dense(channel0)
self.dense1 = nn.Dense(channel1)
def hybrid_forward(self, F, x):
x_reshape = x.reshape((4, 16, 128, 32))
y = self.dense0(x_reshape)
y_slice = y.slice(begin=(1, 32), end=(3, 64))
out = self.dense1(y_slice)
return out
x = mx.nd.random.uniform(shape=(4, 16, 64, 64))
net = Net()
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(96, (1, 1))
self.bn0 = nn.BatchNorm()
self.reshape = shape
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_reshape = x_in.reshape(self.reshape)
out = self.bn0(x_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 32, 64, 64))
shape = (4, 64, 64, -1)
net = Net(shape)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(128, (1, 1))
self.bn0 = nn.BatchNorm()
self.slice = slice
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_slice = x_in.slice(begin=tuple(self.slice[0]),
end=tuple(self.slice[1]))
out = self.bn0(x_slice)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
slice = [[0, 0, 0, 0], [4, 32, 32, 32]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_batchnorm_slice_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(128, (1, 1))
self.bn0 = nn.BatchNorm()
self.bn1 = nn.BatchNorm()
self.slice = slice
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_slice = x_in.slice(begin=tuple(self.slice[0][0]), end=tuple(self.slice[0][1]))
y = self.bn0(x_slice)
y_slice = y.slice(begin=tuple(self.slice[1][0]), end=tuple(self.slice[1][1]))
out = self.bn1(y_slice)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
slice = [[[0, 0, 0, 0], [4, 32, 32, 32]], [[0, 0, 0, 0], [2, 64, 16, 16]]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_batchnorm_reshape_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(128, (1, 1))
self.bn0 = nn.BatchNorm()
self.bn1 = nn.BatchNorm()
self.reshape = shape
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_reshape = x_in.reshape(self.reshape[0])
y = self.bn0(x_reshape)
y_reshape = y.reshape(self.reshape[1])
out = self.bn1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 32, 64, 64))
shape = [(4, 64, 64, -1), (4, 128, -1, 32)]
net = Net(shape)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_batchnorm_reshape_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(128, (1, 1))
self.bn0 = nn.BatchNorm()
self.bn1 = nn.BatchNorm()
self.reshape = shape
self.slice = slice
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_slice = x_in.slice(begin=tuple(self.slice[0]), end=tuple(self.slice[1]))
y = self.bn0(x_slice)
y_reshape = y.reshape(self.reshape)
out = self.bn1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
slice = [[0, 0, 0, 0], [4, 32, 32, 32]]
shape = (1, 128, 64, -1)
net = Net(shape, slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_batchnorm_slice_batchnorm():
class Net(gluon.HybridBlock):
def __init__(self, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.conv0 = nn.Conv2D(128, (1, 1))
self.bn0 = nn.BatchNorm()
self.bn1 = nn.BatchNorm()
self.reshape = shape
self.slice = slice
def hybrid_forward(self, F, x):
x_in = self.conv0(x)
x_reshape = x_in.reshape(self.reshape)
y = self.bn0(x_reshape)
y_slice = y.slice(begin=tuple(self.slice[0]), end=tuple(self.slice[1]))
out = self.bn1(y_slice)
return out
x = mx.nd.random.uniform(shape=(4, 32, 64, 64))
slice = [[0, 0, 0, 0], [2, 64, 32, 32]]
shape = (4, 64, 64, -1)
net = Net(shape, slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_pooling2d():
max_pooling = nn.MaxPool2D(strides=(2, 3), padding=(1, 1))
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1))
global_maxpooling = nn.GlobalMaxPool2D()
global_avgpooling = nn.GlobalAvgPool2D()
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
shape,
pooling_layer,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.pool0 = pooling_layer
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
out = self.pool0(x_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 32, 32, 32))
shape = (4, 64, 64, -1)
for i in range(len(pooling_layers)):
net = Net(shape, pooling_layers[i])
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_pooling2d():
# transpose shape to bring feature dimension 'c' from 2nd position to last
def transpose(shape):
return (shape[0],) + shape[2:] + (shape[1],)
for layout in ['NCHW', 'NHWC']:
max_pooling = nn.MaxPool2D(strides=(2, 3), padding=(1, 1), layout=layout)
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1), layout=layout)
global_maxpooling = nn.GlobalMaxPool2D(layout=layout)
global_avgpooling = nn.GlobalAvgPool2D(layout=layout)
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
slice,
pooling_layer,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.pool0 = pooling_layer
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
out = self.pool0(x_slice)
return out
xshape = (16, 128, 256, 256)
slice_shape = (4, 16, 32, 64)
if layout == 'NHWC':
xshape = transpose(xshape)
slice_shape = transpose(slice_shape)
x = mx.nd.random.uniform(shape=xshape)
slice = [(0, 0, 0, 0), slice_shape]
for i in range(len(pooling_layers)):
net = Net(slice, pooling_layers[i])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_pooling2d_reshape_pooling2d():
max_pooling = nn.MaxPool2D(strides=(2, 2), padding=(1, 1))
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1))
global_maxpooling = nn.GlobalMaxPool2D()
global_avgpooling = nn.GlobalAvgPool2D()
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
shape,
pooling_layer1,
pooling_layer2,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.pool0 = pooling_layer1
self.pool1 = pooling_layer2
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape[0])
y = self.pool0(x_reshape)
y_reshape = y.reshape(self.reshape[1])
out = self.pool1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
shape = [(128, 256, 64, -1), (128, 256, 11, -1)]
for i in range(len(pooling_layers)):
for j in range(len(pooling_layers)):
if isinstance(pooling_layers[i], (nn.GlobalMaxPool2D, nn.GlobalAvgPool2D)):
shape[1] = (256, 128, 1, 1)
net = Net(shape, pooling_layers[i], pooling_layers[j])
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_pooling2d_slice_pooling2d():
max_pooling = nn.MaxPool2D(strides=(2, 3), padding=(1, 1))
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1))
global_maxpooling = nn.GlobalMaxPool2D()
global_avgpooling = nn.GlobalAvgPool2D()
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
slice,
pooling_layer1,
pooling_layer2,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.pool0 = pooling_layer1
self.pool1 = pooling_layer2
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0][0], end=self.slice[0][1])
y = self.pool0(x_slice)
y_slice = y.slice(begin=self.slice[1][0], end=self.slice[1][1])
out = self.pool1(y_slice)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
slice = [[(8, 0, 100, 50), (16, -1, -1, -1)], [(0, 64, 0, 50), (2, -1, -1, -1)]]
for i in range(len(pooling_layers)):
for j in range(len(pooling_layers)):
if isinstance(pooling_layers[i], (nn.GlobalMaxPool2D, nn.GlobalAvgPool2D)):
slice[1] = [(0, 64, 0, 0), (2, -1, 1, 1)]
net = Net(slice, pooling_layers[i], pooling_layers[j])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_pooling2d_reshape_pooling2d():
max_pooling = nn.MaxPool2D(strides=(2, 3), padding=(1, 1))
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1))
global_maxpooling = nn.GlobalMaxPool2D()
global_avgpooling = nn.GlobalAvgPool2D()
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
shape,
slice,
pooling_layer1,
pooling_layer2,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.pool0 = pooling_layer1
self.pool1 = pooling_layer2
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
y = self.pool0(x_slice)
y_reshape = y.reshape(self.reshape)
out = self.pool1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
slice = [(8, 0, 100, 50), (16, 128, 256, 256)]
shape = (32, -1, 0, 0)
for i in range(len(pooling_layers)):
for j in range(len(pooling_layers)):
net = Net(shape, slice, pooling_layers[i], pooling_layers[j])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_pooling2d_slice_pooling2d():
max_pooling = nn.MaxPool2D(strides=(2, 3), padding=(1, 1))
avg_pooling = nn.AvgPool2D(strides=(2, 2), padding=(1, 1))
global_maxpooling = nn.GlobalMaxPool2D()
global_avgpooling = nn.GlobalAvgPool2D()
pooling_layers = [max_pooling, avg_pooling, global_maxpooling, global_avgpooling]
class Net(gluon.HybridBlock):
def __init__(self,
shape,
slice,
pooling_layer1,
pooling_layer2,
**kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.pool0 = pooling_layer1
self.pool1 = pooling_layer2
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
y = self.pool0(x_reshape)
y_slice = y.slice(begin=self.slice[0], end=self.slice[1])
out = self.pool1(y_slice)
return out
x = mx.nd.random.uniform(shape=(16, 128, 256, 256))
shape = (0, 512, 64, -1)
slice = [(8, 256, 10, 20), (-1, -1, -1, 70)]
for i in range(len(pooling_layers)):
for j in range(len(pooling_layers)):
if isinstance(pooling_layers[i], (nn.GlobalMaxPool2D, nn.GlobalAvgPool2D)):
slice = [(8, 256, 0, 0), (-1, -1, 1, 1)]
net = Net(shape, slice, pooling_layers[i], pooling_layers[j])
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_deconv():
class Net(gluon.HybridBlock):
def __init__(self, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.conv0 = nn.Conv2DTranspose(64, (3, 3))
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
out = self.conv0(x_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 16, 32, 32))
shape = (4, 16, 64, -1)
net = Net(shape)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_deconv():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.conv0 = nn.Conv2DTranspose(64, (3, 3))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
out = self.conv0(x_slice)
return out
x = mx.nd.random.uniform(shape=(8, 32, 64, 64))
slice = [(0, 16, 0, 0), (4, 32, 32, 32)]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_deconv_reshape_deconv():
class Net(gluon.HybridBlock):
def __init__(self, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.conv0 = nn.Conv2DTranspose(32, (3, 3))
self.conv1 = nn.Conv2DTranspose(64, (3, 3), strides=(2, 2))
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape[0])
y = self.conv0(x_reshape)
"shape of y is (4, 32, 66, 18)"
y_reshape = y.reshape(self.reshape[1])
out = self.conv1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(4, 16, 32, 32))
shape = [(4, 16, 64, -1), (4, 32, 33, -1)]
net = Net(shape)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_deconv_slice_deconv():
class Net(gluon.HybridBlock):
def __init__(self, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.conv0 = nn.Conv2DTranspose(32, (3, 3))
self.conv1 = nn.Conv2DTranspose(64, (3, 3), strides=(2, 2))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0][0], end=self.slice[0][1])
y = self.conv0(x_slice)
"shape of y is (4, 32, 66, 18)"
y_slice = y.slice(begin=self.slice[1][0], end=self.slice[1][1])
out = self.conv1(y_slice)
return out
x = mx.nd.random.uniform(shape=(8, 32, 64, 64))
slice = [[(0, 0, 0, 0), (4, 16, 32, 32)], [(0, 0, 0, 0), (2, 16, 16, 16)]]
net = Net(slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_reshape_deconv_slice_deconv():
class Net(gluon.HybridBlock):
def __init__(self, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.conv0 = nn.Conv2DTranspose(32, (3, 3))
self.conv1 = nn.Conv2DTranspose(64, (3, 3), strides=(2, 2))
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
y = self.conv0(x_reshape)
"shape of y is (4, 32, 66, 18)"
y_slice = y.slice(begin=self.slice[0], end=self.slice[1])
out = self.conv1(y_slice)
return out
x = mx.nd.random.uniform(shape=(4, 16, 32, 32))
shape = (4, 16, 64, -1)
slice = [(0, 0, 0, 0), (2, 16, 16, 16)]
net = Net(shape, slice)
check_layer_forward_withinput(net, x)
@with_seed()
@unittest.skip('skipping temporarily, tracked by https://github.com/apache/incubator-mxnet/issues/11164')
def test_slice_deconv_reshape_deconv():
class Net(gluon.HybridBlock):
def __init__(self, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.conv0 = nn.Conv2DTranspose(32, (3, 3))
self.conv1 = nn.Conv2DTranspose(96, (3, 3), strides=(2, 2))
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
y = self.conv0(x_slice)
"shape of y is (4, 32, 34, 34)"
y_reshape = y.reshape(self.reshape)
out = self.conv1(y_reshape)
return out
x = mx.nd.random.uniform(shape=(8, 32, 64, 64))
shape = (4, 64, 34, -1)
slice = [(4, 0, 0, 0), (8, 16, 32, 32)]
net = Net(shape, slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_activation():
class Net(gluon.HybridBlock):
def __init__(self, act, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.act = nn.Activation(act)
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
out = self.act(x_reshape)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for act in acts:
x = mx.nd.random.uniform(-1, 1, shape=(4, 16, 32, 32))
shape = (4, 32, 32, -1)
net = Net(act, shape)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_activation():
class Net(gluon.HybridBlock):
def __init__(self, act, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.act = nn.Activation(act)
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
out = self.act(x_slice)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for act in acts:
x = mx.nd.random.uniform(-1, 1, shape=(8, 32, 64, 64))
slice = [(0, 16, 32, 32), (4, 32, 64, 64)]
net = Net(act, slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_activation_reshape_activation():
class Net(gluon.HybridBlock):
def __init__(self, act0, act1, shape, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.act0 = nn.Activation(act0)
self.act1 = nn.Activation(act1)
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape[0])
y = self.act0(x_reshape)
y_reshape = y.reshape(self.reshape[1])
out = self.act1(y_reshape)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for idx0, act0 in enumerate(acts):
for idx1, act1 in enumerate(acts):
if idx1 == idx0:
continue
x = mx.nd.random.uniform(-1, 1, shape=(4, 16, 32, 32))
shape = [(4, 32, 32, -1), (4, 32, 16, -1)]
net = Net(act0, act1, shape)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_activation_slice_activation():
class Net(gluon.HybridBlock):
def __init__(self, act0, act1, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.slice = slice
self.act0 = nn.Activation(act0)
self.act1 = nn.Activation(act1)
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0][0], end=self.slice[0][1])
y = self.act0(x_slice)
y_slice = y.slice(begin=self.slice[1][0], end=self.slice[1][1])
out = self.act1(y_slice)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for idx0, act0 in enumerate(acts):
for idx1, act1 in enumerate(acts):
if idx1 == idx0:
continue
x = mx.nd.random.uniform(-1, 1, shape=(8, 32, 64, 64))
slice = [[(0, 16, 32, 32), (4, 32, 64, 64)], [(2, 0, 16, 16), (4, 16, 32, 32)]]
net = Net(act0, act1, slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_reshape_activation_slice_activation():
class Net(gluon.HybridBlock):
def __init__(self, act0, act1, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.act0 = nn.Activation(act0)
self.act1 = nn.Activation(act1)
def hybrid_forward(self, F, x):
x_reshape = x.reshape(self.reshape)
y = self.act0(x_reshape)
y_slice = y.slice(begin=self.slice[0], end=self.slice[1])
out = self.act1(y_slice)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for idx0, act0 in enumerate(acts):
for idx1, act1 in enumerate(acts):
if idx1 == idx0:
continue
x = mx.nd.random.uniform(-1, 1, shape=(4, 16, 32, 32))
shape = (4, 32, 32, -1)
slice = [(0, 0, 0, 0), (2, 16, 16, 16)]
net = Net(act0, act1, shape, slice)
check_layer_forward_withinput(net, x)
@with_seed()
def test_slice_activation_reshape_activation():
class Net(gluon.HybridBlock):
def __init__(self, act0, act1, shape, slice, **kwargs):
super(Net, self).__init__(**kwargs)
with self.name_scope():
self.reshape = shape
self.slice = slice
self.act0 = nn.Activation(act0)
self.act1 = nn.Activation(act1)
def hybrid_forward(self, F, x):
x_slice = x.slice(begin=self.slice[0], end=self.slice[1])
y = self.act0(x_slice)
y_reshape = y.reshape(self.reshape)
out = self.act1(y_reshape)
return out
acts = ["relu", "sigmoid", "tanh", "softrelu", "softsign"]
for idx0, act0 in enumerate(acts):
for idx1, act1 in enumerate(acts):
if idx1 == idx0:
continue
x = mx.nd.random.uniform(-1, 1, shape=(8, 32, 64, 64))
slice = [(0, 16, 32, 32), (4, 32, 64, 64)]
shape = (4, 32, 32, -1)
net = Net(act0, act1, shape, slice)
check_layer_forward_withinput(net, x)
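# Deferred parameter shape inference should still work with numpy shape semantics enabled.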
@with_seed()
def test_np_shape_parameters():
class Foo(gluon.Block):
def __init__(self, **kwargs):
super(Foo, self).__init__(**kwargs)
self.dense = gluon.nn.Dense(16)
def forward(self, x):
return self.dense(x)
with mx.np_shape(True):
z = mx.nd.zeros((2,2016))
print(z.shape)
foo = Foo()
foo.initialize()
print(foo(z).shape)
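# float32 parameters saved to disk should load into a float16-cast net when cast_dtype=True.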
@with_seed()
def test_gluon_param_load():
net = mx.gluon.nn.Dense(10, in_units=10)
net.initialize()
net.save_parameters('test_gluon_param_load.params')
net.cast('float16')
net.load_parameters('test_gluon_param_load.params', cast_dtype=True)
mx.nd.waitall()
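# With dtype_source="saved", loaded parameters keep the dtype stored in the file (float16 here),
# even though the net was cast back to float32 before loading.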
@with_seed()
def test_gluon_param_load_dtype_source():
net = mx.gluon.nn.Dense(10, in_units=10)
net.initialize()
net.cast('float16')
net.save_parameters('test_gluon_param_load_dtype_source.params')
net.cast('float32')
net.load_parameters('test_gluon_param_load_dtype_source.params', cast_dtype=True, dtype_source="saved")
assert net.weight.dtype == np.float16
mx.nd.waitall()
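# squeeze(inplace=True) and squeeze(inplace=False) should both run on a hybridized block.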
@with_seed()
def test_squeeze_consistency():
class Foo(gluon.HybridBlock):
def __init__(self, inplace, **kwargs):
super(Foo, self).__init__(**kwargs)
self.inplace = inplace
def forward(self, x):
return x.squeeze(inplace=self.inplace)
for inplace in (True, False):
block = Foo(inplace)
block.hybridize()
shape = (np.random.randint(1, 10), np.random.randint(1, 10), 1)
block(mx.nd.ones(shape))
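# Gradient requests must be handled correctly when a static_alloc block alternates
# between training and inference; the gradient from the final training call should
# match the one from the first.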
@with_seed()
def test_reqs_switching_training_inference():
class Foo(gluon.HybridBlock):
def __init__(self, **kwargs):
super(Foo, self).__init__(**kwargs)
def hybrid_forward(self, F, x):
y = 2 * x
return F.sqrt(x) + F.sqrt(y)
f = Foo()
f.hybridize(static_alloc=True)
x = mx.nd.ones(shape=(10,10))
x.attach_grad()
x2 = mx.nd.ones(shape=x.shape) * 2
x2.attach_grad()
# Call first in training mode
with mx.autograd.record():
y = f(x)
y.backward()
grad1 = x.grad.asnumpy()
# Compute the gradient with some other input
with mx.autograd.record():
y = f(x2)
y.backward()
# Call inference mode
y = f(x)
# Call training mode again
with mx.autograd.record():
y = f(x)
y.backward()
grad2 = x.grad.asnumpy()
mx.test_utils.assert_almost_equal(grad1, grad2)
if __name__ == '__main__':
import nose
nose.runmodule()