blob: 7a24f92816526bae81c81e9056f55d910928d03d [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
# This file is primarily to be included from runtest.jl. We tried to cover various
# features of MXNet.jl in this example in order to detect regression errors.
module MNISTTest
using MXNet
using Test
include("mnist-data.jl")
"""
    get_mnist_mlp()

Build the symbolic network for a small MNIST multi-layer perceptron:
two ReLU hidden layers (128 and 64 units) followed by a 10-way
softmax output. Layer names match those expected by the data provider
(`:data` input, `:softmax` output).
"""
function get_mnist_mlp()
    net = mx.Variable(:data)
    net = mx.FullyConnected(net, name=:fc1, num_hidden=128)
    net = mx.Activation(net, name=:relu1, act_type=:relu)
    net = mx.FullyConnected(net, name=:fc2, num_hidden=64)
    net = mx.Activation(net, name=:relu2, act_type=:relu)
    net = mx.FullyConnected(net, name=:fc3, num_hidden=10)
    return mx.SoftmaxOutput(net, name=:softmax)
end
get_mnist_data(batch_size = 100) = get_mnist_providers(batch_size)
"""
    mnist_fit_and_predict(optimizer, initializer, n_epoch)

Train the MNIST MLP with the given `optimizer` and `initializer` for
`n_epoch` epochs, exercising several MXNet.jl features along the way:
checkpoint callbacks, symbol save/load round-trips, the predict API and
graphviz visualization. Returns the eval-set accuracy in percent.
"""
function mnist_fit_and_predict(optimizer, initializer, n_epoch)
mlp = get_mnist_mlp()
train_provider, eval_provider = get_mnist_data()
# setup model
model = mx.FeedForward(mlp, context = mx.cpu())
# fit parameters
cp_prefix = "mnist-test-cp"
# save_epoch_0=true writes a checkpoint before training starts, so the
# loop below expects params files for epochs 0 through n_epoch inclusive
mx.fit(model, optimizer, train_provider, eval_data=eval_provider, n_epoch=n_epoch,
initializer=initializer, callbacks=[mx.speedometer(), mx.do_checkpoint(cp_prefix, save_epoch_0=true)])
# make sure the checkpoints are saved
@test isfile("$cp_prefix-symbol.json")
for i_epoch = 0:n_epoch
@test isfile(mx.format("{1}-{2:04d}.params", cp_prefix, i_epoch))
end
# round-trip the symbol through the saved JSON: once via the file loader,
# once via from_json on the raw string; both must reproduce the network
mlp_load = mx.load("$cp_prefix-symbol.json", mx.SymbolicNode)
@test mx.to_json(mlp_load) == mx.to_json(mlp)
mlp_load = mx.from_json(read("$cp_prefix-symbol.json", String), mx.SymbolicNode)
@test mx.to_json(mlp_load) == mx.to_json(mlp)
#--------------------------------------------------------------------------------
# the predict API
probs = mx.predict(model, eval_provider)
# collect all labels from eval data
labels = Array[]
for batch in eval_provider
push!(labels, copy(mx.get(eval_provider, batch, :softmax_label)))
end
labels = cat(labels..., dims = 1)
# Now compute the accuracy
correct = 0
for i = 1:length(labels)
# labels are 0...9
if argmax(probs[:,i]) == labels[i]+1
correct += 1
end
end
accuracy = 100correct/length(labels)
println(mx.format("Accuracy on eval set: {1:.2f}%", accuracy))
# try to call visualization (only checks that it runs without error)
dot_code = mx.to_graphviz(mlp)
return accuracy
end
"""
    test_mnist_mlp()

Run the MNIST MLP training end-to-end with each supported optimizer and
assert the eval-set accuracy exceeds 90% after 2 epochs.
"""
function test_mnist_mlp()
    @info("MNIST::SGD")
    @test mnist_fit_and_predict(mx.SGD(η=.2), mx.UniformInitializer(.01), 2) > 90

    @info("MNIST::SGD::η scheduler")
    # Fixed: this line was garbled (`mx.SGD_sched=mx.LearningRate.Inv(.25)),`),
    # a syntax error — the learning-rate scheduler is the η_sched keyword
    # argument of the SGD constructor.
    @test mnist_fit_and_predict(mx.SGD(η_sched=mx.LearningRate.Inv(.25)),
                                mx.UniformInitializer(.01), 2) > 90

    @info("MNIST::SGD::momentum μ")
    @test mnist_fit_and_predict(mx.SGD(η=.1, μ=.9), mx.UniformInitializer(.01), 2) > 90

    @info("MNIST::ADAM")
    @test mnist_fit_and_predict(mx.ADAM(), mx.NormalInitializer(), 2) > 90

    @info("MNIST::AdaGrad")
    @test mnist_fit_and_predict(mx.AdaGrad(), mx.NormalInitializer(), 2) > 90

    @info("MNIST::AdaDelta")
    @test mnist_fit_and_predict(mx.AdaDelta(), mx.NormalInitializer(), 2) > 90

    @info("MNIST::AdaMax")
    @test mnist_fit_and_predict(mx.AdaMax(), mx.NormalInitializer(), 2) > 90

    @info("MNIST::RMSProp")
    @test mnist_fit_and_predict(mx.RMSProp(), mx.NormalInitializer(), 2) > 90

    @info("MNIST::Nadam")
    @test mnist_fit_and_predict(mx.Nadam(), mx.NormalInitializer(), 2) > 90
end

test_mnist_mlp()
end # module MNISTTest