# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
import ctypes
import numpy as np
from tvm import relay
import tvm.relay.testing
from tvm.contrib import graph_executor, cc, utils, popen_pool, tar
import tvm
import tvm.testing
from tvm.script import ir as I, tir as T

@tvm.testing.uses_gpu
def test_synthetic():
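    # Require both LLVM and CUDA; otherwise skip the whole test.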
    for device in ["llvm", "cuda"]:
        if not tvm.testing.device_enabled(device):
            print("skip because %s is not enabled..." % device)
            return

    input_shape = (1, 5, 23, 61)
    def verify(data):
        mod, params = relay.testing.synthetic.get_workload(input_shape=input_shape)
        with tvm.transform.PassContext(opt_level=3):
            lib = relay.build_module.build(mod, "llvm", params=params)
        dev = tvm.cpu()
        module = graph_executor.GraphModule(lib["default"](dev))
        module.set_input("data", data)
        module.run()
        out = module.get_output(0).numpy()
        return out
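    # Build the same workload for CUDA, then round-trip the compiled module
    # through export_library/load_module before running it on the GPU.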
    synthetic_mod, synthetic_params = relay.testing.synthetic.get_workload(input_shape=input_shape)
    with tvm.transform.PassContext(opt_level=3):
        synthetic_gpu_lib = relay.build_module.build(synthetic_mod, "cuda", params=synthetic_params)
    temp = utils.tempdir()
    path_lib = temp.relpath("deploy_lib.so")
    synthetic_gpu_lib.export_library(path_lib)
    loaded_lib = tvm.runtime.load_module(path_lib)
    data = np.random.uniform(-1, 1, size=input_shape).astype("float32")
    dev = tvm.cuda()
    module = graph_executor.GraphModule(loaded_lib["default"](dev))
    module.set_input("data", data)
    module.run()
    out = module.get_output(0).numpy()
    tvm.testing.assert_allclose(out, verify(data), atol=1e-5)

@tvm.testing.uses_gpu
def test_cuda_multi_lib():
    # Test combining two system libs, each containing a CUDA fatbin
    # component, into a single shared library.
    dev = tvm.cuda(0)
    for device in ["llvm", "cuda"]:
        if not tvm.testing.device_enabled(device):
            print("skip because %s is not enabled..." % device)
            return
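    # Two TVMScript modules with distinct system_lib_prefix attributes; the
    # prefix namespaces each module's symbols in the system library registry.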
    @tvm.script.ir_module
    class ModA:
        I.module_attrs({"system_lib_prefix": "modA_"})

        @T.prim_func
        def my_inplace_update(x: T.Buffer((12), "float32")) -> None:
            T.func_attr({"global_symbol": "modA_my_inplace_update"})
            for bx in T.thread_binding(T.int64(1), thread="blockIdx.x"):
                for tx in T.thread_binding(T.int64(12), thread="threadIdx.x"):
                    x[tx] = x[tx] + 1
    @tvm.script.ir_module
    class ModB:
        I.module_attrs({"system_lib_prefix": "modB_"})

        @T.prim_func
        def my_inplace_update(x: T.Buffer((12), "float32")) -> None:
            T.func_attr({"global_symbol": "modB_my_inplace_update"})
            for bx in T.thread_binding(T.int64(1), thread="blockIdx.x"):
                for tx in T.thread_binding(T.int64(12), thread="threadIdx.x"):
                    x[tx] = x[tx] + 2
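    # Because the prefixes differ, both modules can be linked into the same
    # binary without their registered symbols colliding.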
    temp = utils.tempdir()
    target = tvm.target.Target("cuda", host="llvm")
    libA = tvm.build(ModA, target=target)
    libB = tvm.build(ModB, target=target)
    pathA = temp.relpath("libA.tar")
    pathB = temp.relpath("libB.tar")
    pathAll = temp.relpath("libAll.a")
    path_dso = temp.relpath("mylib.so")
    libA.export_library(pathA, fcompile=tar.tar)
    libB.export_library(pathB, fcompile=tar.tar)
    cc.create_staticlib(pathAll, [pathA, pathB])
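    # --whole-archive forces the linker to keep every object in the static
    # lib, so the system-lib registration that runs via static initializers
    # is not dropped as unreferenced.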
    # package two static libs together
    cc.create_shared(path_dso, ["-Wl,--whole-archive", pathAll, "-Wl,--no-whole-archive"])
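    # Roughly equivalent to an invocation like the following (illustrative
    # only; the exact command and compiler are toolchain-dependent):
    #   g++ -shared -fPIC -o mylib.so -Wl,--whole-archive libAll.a -Wl,--no-whole-archive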
    def popen_check():
        # Loading the DLL triggers system library registration.
        ctypes.CDLL(path_dso)
        # Look up the system-wide libraries by prefix.
        dev = tvm.cuda()
        a_np = np.random.uniform(size=12).astype("float32")
        a_nd = tvm.nd.array(a_np, dev)
        b_nd = tvm.nd.array(a_np, dev)
        syslibA = tvm.runtime.system_lib("modA_")
        syslibB = tvm.runtime.system_lib("modB_")
        # Fetching the same lib a second time must also work.
        syslibA = tvm.runtime.system_lib("modA_")
        syslibA["my_inplace_update"](a_nd)
        syslibB["my_inplace_update"](b_nd)
        np.testing.assert_equal(a_nd.numpy(), a_np + 1)
        np.testing.assert_equal(b_nd.numpy(), a_np + 2)
    # The system lib should be loaded in a separate, fresh process.
    worker = popen_pool.PopenWorker()
    worker.send(popen_check)
    worker.recv()

if __name__ == "__main__":
    test_synthetic()
    test_cuda_multi_lib()