blob: a7b2c3671409db029227be458678c2799a6a59fa [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
// header file to use mshadow
#include "mshadow/tensor.h"
// this namespace contains all data structures, functions
using namespace mshadow;
// this namespace contains all operator overloads
using namespace mshadow::expr;
int main(void) {
  // initialize tensor engine before using tensor operations, needed for CuBLAS
  InitTensorEngine<cpu>();
  // assume we have a float space
  float data[20];
  // create a 2 x 5 x 2 tensor, from existing space
  Tensor<cpu, 3> ts(data, Shape3(2, 5, 2));
  // take first subscript of the tensor
  Tensor<cpu, 2> mat = ts[0];
  // Tensor object is only a handle; assignment means both refer to the same data
  // we can specify the content type of a Tensor; if not specified, it is float by default
  Tensor<cpu, 2, float> mat2 = mat;
  mat = Tensor<cpu, 1>(data, Shape1(10)).FlatTo2D();
  // shape of matrix, note size order is same as numpy
  // cast to unsigned: index_t's underlying type is implementation-defined, and a
  // printf vararg that does not match "%u" is undefined behavior
  printf("%u X %u matrix\n", (unsigned)mat.size(0), (unsigned)mat.size(1));
  // initialize all elements to zero
  mat = 0.0f;
  // assign some values
  mat[0][1] = 1.0f; mat[1][0] = 2.0f;
  // elementwise operations
  mat += (mat + 10.0f) / 10.0f + 2.0f;
  // print out matrix; note: mat2 and mat are handles (pointers) over the same data
  for (index_t i = 0; i < mat.size(0); ++i) {
    for (index_t j = 0; j < mat.size(1); ++j) {
      printf("%.2f ", mat2[i][j]);
    }
    printf("\n");
  }
  // matrix product via implicit_dot: (2x3) * (3x2) -> (2x2)
  TensorContainer<cpu, 2> lhs(Shape2(2, 3)), rhs(Shape2(2, 3)), ret(Shape2(2, 2));
  // use float literals, matching the element type (rest of the file uses f-suffix)
  lhs = 1.0f;
  rhs = 1.0f;
  ret = implicit_dot(lhs, rhs.T());
  // dot product of two 1-D tensors, written into a 1-element slice of ret's row 0
  VectorDot(ret[0].Slice(0, 1), lhs[0], rhs[0]);
  printf("vdot=%f\n", ret[0][0]);
  for (index_t i = 0; i < ret.size(0); ++i) {
    for (index_t j = 0; j < ret.size(1); ++j) {
      printf("%.2f ", ret[i][j]);
    }
    printf("\n");
  }
  printf("\n");
  // refill lhs with a running counter so every element is distinct
  int cnt = 0;  // declared next to the loop that uses it
  for (index_t i = 0; i < lhs.size(0); ++i) {
    for (index_t j = 0; j < lhs.size(1); ++j) {
      lhs[i][j] = cnt++;
      printf("%.2f ", lhs[i][j]);
    }
    printf("\n");
  }
  printf("\n");
  // mat_choose_row_element: presumably picks element index[i] from row i of lhs
  // — confirm against mshadow extension docs
  TensorContainer<cpu, 1> index(Shape1(2)), choosed(Shape1(2));
  index[0] = 1; index[1] = 2;
  choosed = mat_choose_row_element(lhs, index);
  for (index_t i = 0; i < choosed.size(0); ++i) {
    printf("%.2f ", choosed[i]);
  }
  printf("\n");
  // mat_fill_row_element: inverse of the above — writes choosed back into a
  // -100-filled matrix; the printed differences show which elements were recovered
  TensorContainer<cpu, 2> recover_lhs(Shape2(2, 3)), small_mat(Shape2(2, 3));
  small_mat = -100.0f;
  recover_lhs = mat_fill_row_element(small_mat, choosed, index);
  for (index_t i = 0; i < recover_lhs.size(0); ++i) {
    for (index_t j = 0; j < recover_lhs.size(1); ++j) {
      printf("%.2f ", recover_lhs[i][j] - lhs[i][j]);
    }
  }
  printf("\n");
  // one-hot encode index into a 2 x 3 matrix
  rhs = one_hot_encode(index, 3);
  // bound the loops by the tensor actually being printed (was lhs.size(..);
  // same values today, but a latent bug if the shapes ever diverge)
  for (index_t i = 0; i < rhs.size(0); ++i) {
    for (index_t j = 0; j < rhs.size(1); ++j) {
      printf("%.2f ", rhs[i][j]);
    }
    printf("\n");
  }
  printf("\n");
  // embedding lookup: take row idx[i] of weight into row i of embed
  TensorContainer<cpu, 1> idx(Shape1(3));
  idx[0] = 8;
  idx[1] = 0;
  idx[2] = 1;
  TensorContainer<cpu, 2> weight(Shape2(10, 5));
  TensorContainer<cpu, 2> embed(Shape2(3, 5));
  // fill weight so row i holds the constant value i (makes lookups easy to read)
  for (index_t i = 0; i < weight.size(0); ++i) {
    for (index_t j = 0; j < weight.size(1); ++j) {
      weight[i][j] = i;
    }
  }
  embed = take(idx, weight);
  for (index_t i = 0; i < embed.size(0); ++i) {
    for (index_t j = 0; j < embed.size(1); ++j) {
      printf("%.2f ", embed[i][j]);
    }
    printf("\n");
  }
  printf("\n\n");
  // take_grad: scatter embed's rows back into a 10-row gradient for weight
  weight = take_grad(idx, embed, 10);
  for (index_t i = 0; i < weight.size(0); ++i) {
    for (index_t j = 0; j < weight.size(1); ++j) {
      printf("%.2f ", weight[i][j]);
    }
    printf("\n");
  }
  printf("upsampling\n");
  // nearest-neighbour upsampling with scale 3: (2x2) -> (6x6)
  TensorContainer<cpu, 2> small(Shape2(2, 2));
  small[0][0] = 1.0f;
  small[0][1] = 2.0f;
  small[1][0] = 3.0f;
  small[1][1] = 4.0f;
  TensorContainer<cpu, 2> large(Shape2(6, 6));
  large = upsampling_nearest(small, 3);
  for (index_t i = 0; i < large.size(0); ++i) {
    for (index_t j = 0; j < large.size(1); ++j) {
      printf("%.2f ", large[i][j]);
    }
    printf("\n");
  }
  // sum-pool back down to small's shape with a 3x3 window and stride 3
  small = pool<red::sum>(large, small.shape_, 3, 3, 3, 3);
  for (index_t i = 0; i < small.size(0); ++i) {
    for (index_t j = 0; j < small.size(1); ++j) {
      printf("%.2f ", small[i][j]);
    }
    printf("\n");
  }
  printf("mask\n");
  // mask: presumably scales row i of mask_data by mask_src[i] — confirm against
  // mshadow extension docs
  TensorContainer<cpu, 2> mask_data(Shape2(6, 8));
  TensorContainer<cpu, 2> mask_out(Shape2(6, 8));
  TensorContainer<cpu, 1> mask_src(Shape1(6));
  mask_data = 1.0f;
  for (int i = 0; i < 6; ++i) {
    mask_src[i] = static_cast<float>(i);
  }
  mask_out = mask(mask_src, mask_data);
  for (index_t i = 0; i < mask_out.size(0); ++i) {
    for (index_t j = 0; j < mask_out.size(1); ++j) {
      printf("%.2f ", mask_out[i][j]);
    }
    printf("\n");
  }
  // shutdown tensor engine after usage
  ShutdownTensorEngine<cpu>();
  return 0;
}