examples/autograd/mnist_cnn.py - singa - Git at Google

 #
 # Licensed to the Apache Software Foundation (ASF) under one
 # or more contributor license agreements.  See the NOTICE file
 # distributed with this work for additional information
 # regarding copyright ownership.  The ASF licenses this file
 # to you under the Apache License, Version 2.0 (the
 # "License"); you may not use this file except in compliance
 # with the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing,
 # software distributed under the License is distributed on an
 # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 # KIND, either express or implied.  See the License for the
 # specific language governing permissions and limitations
 # under the License.
 #

 import numpy as np
 import argparse
 import os

 from singa import device
 from singa import tensor
 from singa import autograd
 from singa import opt


 def load_data(path):
     """
     Loads the MNIST train/test arrays from an ``.npz`` archive.

     Args
         path: location of an archive readable by ``np.load`` that holds
             the arrays ``x_train``, ``y_train``, ``x_test`` and ``y_test``.

     Return
         ``((x_train, y_train), (x_test, y_test))``.

     Raises
         KeyError: if one of the four arrays is missing from the archive.
     """
     # The context manager closes the archive even when a lookup fails.
     # Each array is read into memory at lookup time, so the returned
     # arrays remain valid after the archive has been closed.
     with np.load(path) as f:
         x_train, y_train = f["x_train"], f["y_train"]
         x_test, y_test = f["x_test"], f["y_test"]
     return (x_train, y_train), (x_test, y_test)


 def to_categorical(y, num_classes):
     """
     Converts a class vector (integers) to binary class matrix.

     Args
         y: class vector to be converted into a matrix
             (integers from 0 to num_classes - 1).
         num_classes: total number of classes.

     Return
         A float32 matrix of shape (len(y), num_classes) in which row i
         holds a single 1 at column y[i] and 0 everywhere else.

     Raises
         IndexError: if any label lies outside [0, num_classes).
     """
     y = np.array(y, dtype="int")
     n = y.shape[0]
     # Without this check a negative label would wrap around through
     # NumPy's negative indexing and silently mark the wrong class.
     if np.any((y < 0) | (y >= num_classes)):
         raise IndexError(
             "labels must lie in [0, %d), got values between %d and %d"
             % (num_classes, y.min(), y.max())
         )
     # Allocate float32 directly instead of building a float64 matrix
     # and casting it afterwards.
     categorical = np.zeros((n, num_classes), dtype=np.float32)
     categorical[np.arange(n), y] = 1
     return categorical


 def preprocess(data):
     """
     Rescales an array by 1/255 and inserts a length-1 axis at position 1.

     Args
         data: array offering ``astype``; it is copied, not modified.

     Return
         A float32 array equal to ``data / 255`` with one extra axis
         inserted at index 1.
     """
     scaled = data.astype(np.float32)
     # In-place division keeps the float32 dtype of the fresh copy.
     np.true_divide(scaled, 255, out=scaled)
     return np.expand_dims(scaled, 1)


 def accuracy(pred, target):
     """
     Computes the fraction of rows where the arg-max columns agree.

     Args
         pred: 2-D array of per-class scores, one row per sample.
         target: 2-D array whose row-wise arg-max is the true class.

     Return
         Number of matching rows divided by the number of rows.
     """
     predicted = np.argmax(pred, axis=1)
     expected = np.argmax(target, axis=1)
     hits = (predicted == expected).astype("int").sum()
     return hits / float(expected.shape[0])


 if __name__ == "__main__":
     # Script entry point: parse the command line, load and preprocess
     # MNIST, build a small CNN from autograd operations and train it with
     # SGD, printing accuracy and loss every fifth mini-batch.

     parser = argparse.ArgumentParser(description="Train CNN over MNIST")
     parser.add_argument("file_path", type=str, help="the dataset path")
     parser.add_argument("--use_cpu", action="store_true")
     args = parser.parse_args()

     # Explicit check instead of `assert`: assertions are stripped when
     # Python runs with -O, which would let a missing file slip through.
     if not os.path.exists(args.file_path):
         parser.error(
             "Pls download the MNIST dataset from https://s3.amazonaws.com/img-datasets/mnist.npz"
         )

     if args.use_cpu:
         print("Using CPU")
         dev = device.get_default_device()
     else:
         print("Using GPU")
         dev = device.create_cuda_gpu()

     train, test = load_data(args.file_path)

     batch_size = 100
     num_classes = 10
     epochs = 1

     sgd = opt.SGD(lr=0.01)

     x_train = preprocess(train[0])
     y_train = to_categorical(train[1], num_classes)

     x_test = preprocess(test[0])
     y_test = to_categorical(test[1], num_classes)
     print("the shape of training data is", x_train.shape)
     print("the shape of training label is", y_train.shape)
     print("the shape of testing data is", x_test.shape)
     print("the shape of testing label is", y_test.shape)

     # Number of full mini-batches per epoch (600 for the 60000-sample MNIST
     # training set); a trailing partial batch is not used.
     batch_number = x_train.shape[0] // batch_size

     # operations initialization
     conv1 = autograd.Conv2d(1, 32, 3, padding=1, bias=False)
     bn1 = autograd.BatchNorm2d(32)
     # Two parallel convolutions with 16 outputs each; their results are
     # concatenated along axis 1 in forward().
     conv21 = autograd.Conv2d(32, 16, 3, padding=1)
     conv22 = autograd.Conv2d(32, 16, 3, padding=1)
     bn2 = autograd.BatchNorm2d(32)
     # The input size assumes the layers above keep a 28x28 spatial size
     # with 32 channels -- TODO confirm against the layer definitions.
     linear = autograd.Linear(32 * 28 * 28, 10)
     pooling1 = autograd.MaxPool2d(3, 1, padding=1)
     pooling2 = autograd.AvgPool2d(3, 1, padding=1)

     def forward(x, t):
         """
         Runs the network on one batch.

         Args
             x: input tensor for the batch.
             t: target tensor for the batch.

         Return
             (loss, y) where y is the output of the final linear layer
             and loss is the softmax cross entropy of y against t.
         """
         y = conv1(x)
         y = autograd.relu(y)
         y = bn1(y)
         y = pooling1(y)
         y1 = conv21(y)
         y2 = conv22(y)
         y = autograd.cat((y1, y2), 1)
         # NOTE(review): bn2 is applied both before and after the ReLU,
         # reusing the same layer object -- confirm this is intended.
         y = bn2(y)
         y = autograd.relu(y)
         y = bn2(y)
         y = pooling2(y)
         y = autograd.flatten(y)
         y = linear(y)
         loss = autograd.softmax_cross_entropy(y, t)
         return loss, y

     autograd.training = True
     for epoch in range(epochs):
         for i in range(batch_number):
             start, stop = i * batch_size, (1 + i) * batch_size
             inputs = tensor.Tensor(
                 device=dev,
                 data=x_train[start:stop],
                 stores_grad=False,
             )
             targets = tensor.Tensor(
                 device=dev,
                 data=y_train[start:stop],
                 requires_grad=False,
                 stores_grad=False,
             )

             loss, y = forward(inputs, targets)

             # The accuracy is only reported every fifth batch, so the
             # conversions to NumPy are done only when they are printed.
             if i % 5 == 0:
                 accuracy_rate = accuracy(
                     tensor.to_numpy(y), tensor.to_numpy(targets)
                 )
                 print(
                     "accuracy is:",
                     accuracy_rate,
                     "loss is:",
                     tensor.to_numpy(loss)[0],
                 )

             for p, gp in autograd.backward(loss):
                 sgd.update(p, gp)

             sgd.step()
	#
	# Licensed to the Apache Software Foundation (ASF) under one
	# or more contributor license agreements. See the NOTICE file
	# distributed with this work for additional information
	# regarding copyright ownership. The ASF licenses this file
	# to you under the Apache License, Version 2.0 (the
	# "License"); you may not use this file except in compliance
	# with the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing,
	# software distributed under the License is distributed on an
	# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
	# KIND, either express or implied. See the License for the
	# specific language governing permissions and limitations
	# under the License.
	#

	import numpy as np
	import argparse
	import os

	from singa import device
	from singa import tensor
	from singa import autograd
	from singa import opt


	def load_data(path):
	    """
	    Loads the MNIST train/test arrays from an ``.npz`` archive.

	    Args
	        path: location of an archive readable by ``np.load`` that holds
	            the arrays ``x_train``, ``y_train``, ``x_test`` and ``y_test``.

	    Return
	        ``((x_train, y_train), (x_test, y_test))``.

	    Raises
	        KeyError: if one of the four arrays is missing from the archive.
	    """
	    # The context manager closes the archive even when a lookup fails.
	    # Each array is read into memory at lookup time, so the returned
	    # arrays remain valid after the archive has been closed.
	    with np.load(path) as f:
	        x_train, y_train = f["x_train"], f["y_train"]
	        x_test, y_test = f["x_test"], f["y_test"]
	    return (x_train, y_train), (x_test, y_test)


	def to_categorical(y, num_classes):
	    """
	    Converts a class vector (integers) to binary class matrix.

	    Args
	        y: class vector to be converted into a matrix
	            (integers from 0 to num_classes - 1).
	        num_classes: total number of classes.

	    Return
	        A float32 matrix of shape (len(y), num_classes) in which row i
	        holds a single 1 at column y[i] and 0 everywhere else.

	    Raises
	        IndexError: if any label lies outside [0, num_classes).
	    """
	    y = np.array(y, dtype="int")
	    n = y.shape[0]
	    # Without this check a negative label would wrap around through
	    # NumPy's negative indexing and silently mark the wrong class.
	    if np.any((y < 0) | (y >= num_classes)):
	        raise IndexError(
	            "labels must lie in [0, %d), got values between %d and %d"
	            % (num_classes, y.min(), y.max())
	        )
	    # Allocate float32 directly instead of building a float64 matrix
	    # and casting it afterwards.
	    categorical = np.zeros((n, num_classes), dtype=np.float32)
	    categorical[np.arange(n), y] = 1
	    return categorical


	def preprocess(data):
	    """
	    Rescales an array by 1/255 and inserts a length-1 axis at position 1.

	    Args
	        data: array offering ``astype``; it is copied, not modified.

	    Return
	        A float32 array equal to ``data / 255`` with one extra axis
	        inserted at index 1.
	    """
	    data = data.astype(np.float32)
	    data /= 255
	    data = np.expand_dims(data, axis=1)
	    return data


	def accuracy(pred, target):
	    """
	    Computes the fraction of rows where the arg-max columns agree.

	    Args
	        pred: 2-D array of per-class scores, one row per sample.
	        target: 2-D array whose row-wise arg-max is the true class.

	    Return
	        Number of matching rows divided by the number of rows.
	    """
	    y = np.argmax(pred, axis=1)
	    t = np.argmax(target, axis=1)
	    a = y == t
	    return np.array(a, "int").sum() / float(len(t))


	if __name__ == "__main__":
	    # Script entry point: parse the command line, load and preprocess
	    # MNIST, build a small CNN from autograd operations and train it with
	    # SGD, printing accuracy and loss every fifth mini-batch.

	    parser = argparse.ArgumentParser(description="Train CNN over MNIST")
	    parser.add_argument("file_path", type=str, help="the dataset path")
	    parser.add_argument("--use_cpu", action="store_true")
	    args = parser.parse_args()

	    # Explicit check instead of `assert`: assertions are stripped when
	    # Python runs with -O, which would let a missing file slip through.
	    if not os.path.exists(args.file_path):
	        parser.error(
	            "Pls download the MNIST dataset from https://s3.amazonaws.com/img-datasets/mnist.npz"
	        )

	    if args.use_cpu:
	        print("Using CPU")
	        dev = device.get_default_device()
	    else:
	        print("Using GPU")
	        dev = device.create_cuda_gpu()

	    train, test = load_data(args.file_path)

	    batch_size = 100
	    num_classes = 10
	    epochs = 1

	    sgd = opt.SGD(lr=0.01)

	    x_train = preprocess(train[0])
	    y_train = to_categorical(train[1], num_classes)

	    x_test = preprocess(test[0])
	    y_test = to_categorical(test[1], num_classes)
	    print("the shape of training data is", x_train.shape)
	    print("the shape of training label is", y_train.shape)
	    print("the shape of testing data is", x_test.shape)
	    print("the shape of testing label is", y_test.shape)

	    # Number of full mini-batches per epoch (600 for the 60000-sample MNIST
	    # training set); a trailing partial batch is not used.
	    batch_number = x_train.shape[0] // batch_size

	    # operations initialization
	    conv1 = autograd.Conv2d(1, 32, 3, padding=1, bias=False)
	    bn1 = autograd.BatchNorm2d(32)
	    # Two parallel convolutions with 16 outputs each; their results are
	    # concatenated along axis 1 in forward().
	    conv21 = autograd.Conv2d(32, 16, 3, padding=1)
	    conv22 = autograd.Conv2d(32, 16, 3, padding=1)
	    bn2 = autograd.BatchNorm2d(32)
	    # The input size assumes the layers above keep a 28x28 spatial size
	    # with 32 channels -- TODO confirm against the layer definitions.
	    linear = autograd.Linear(32 * 28 * 28, 10)
	    pooling1 = autograd.MaxPool2d(3, 1, padding=1)
	    pooling2 = autograd.AvgPool2d(3, 1, padding=1)

	    def forward(x, t):
	        """
	        Runs the network on one batch.

	        Args
	            x: input tensor for the batch.
	            t: target tensor for the batch.

	        Return
	            (loss, y) where y is the output of the final linear layer
	            and loss is the softmax cross entropy of y against t.
	        """
	        y = conv1(x)
	        y = autograd.relu(y)
	        y = bn1(y)
	        y = pooling1(y)
	        y1 = conv21(y)
	        y2 = conv22(y)
	        y = autograd.cat((y1, y2), 1)
	        # NOTE(review): bn2 is applied both before and after the ReLU,
	        # reusing the same layer object -- confirm this is intended.
	        y = bn2(y)
	        y = autograd.relu(y)
	        y = bn2(y)
	        y = pooling2(y)
	        y = autograd.flatten(y)
	        y = linear(y)
	        loss = autograd.softmax_cross_entropy(y, t)
	        return loss, y

	    autograd.training = True
	    for epoch in range(epochs):
	        for i in range(batch_number):
	            start, stop = i * batch_size, (1 + i) * batch_size
	            inputs = tensor.Tensor(
	                device=dev,
	                data=x_train[start:stop],
	                stores_grad=False,
	            )
	            targets = tensor.Tensor(
	                device=dev,
	                data=y_train[start:stop],
	                requires_grad=False,
	                stores_grad=False,
	            )

	            loss, y = forward(inputs, targets)

	            # The accuracy is only reported every fifth batch, so the
	            # conversions to NumPy are done only when they are printed.
	            if i % 5 == 0:
	                accuracy_rate = accuracy(
	                    tensor.to_numpy(y), tensor.to_numpy(targets)
	                )
	                print(
	                    "accuracy is:",
	                    accuracy_rate,
	                    "loss is:",
	                    tensor.to_numpy(loss)[0],
	                )

	            for p, gp in autograd.backward(loss):
	                sgd.update(p, gp)

	            sgd.step()