// blob: 6abd12252d1d8ee1c5b4e4ba3e2bb8ad24600965 [file] [log] [blame]
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

/*!
 * \file
 * \brief Support functions to be linked with wasm_runtime to provide
 *        PackedFunc callbacks in tvmjs.
 *        We do not need to link this file in standalone wasm.
 */

// configurations for the dmlc log.
#define DMLC_LOG_DEBUG 0
#include <tvm/runtime/c_runtime_api.h>
#include <tvm/runtime/container.h>
#include <tvm/runtime/device_api.h>
#include <tvm/runtime/packed_func.h>
#include <tvm/runtime/registry.h>
#include "../../src/runtime/rpc/rpc_local_session.h"
extern "C" {
// --- Additional C API for the Wasm runtime ---
* \brief Allocate space aligned to 64 bit.
* \param size The size of the space.
* \return The allocated space.
TVM_DLL void* TVMWasmAllocSpace(int size);
* \brief Free the space allocated by TVMWasmAllocSpace.
* \param data The data pointer.
TVM_DLL void TVMWasmFreeSpace(void* data);
* \brief Create PackedFunc from a resource handle.
* \param resource_handle The handle to the resource.
* \param out The output PackedFunc.
* \sa TVMWasmPackedCFunc, TVMWasmPackedCFuncFinalizer
3A * \return 0 if success.
TVM_DLL int TVMWasmFuncCreateFromCFunc(void* resource_handle, TVMFunctionHandle* out);
// --- APIs to be implemented by the frontend. ---
* \brief Wasm frontend packed function caller.
* \param args The arguments
* \param type_codes The type codes of the arguments
* \param num_args Number of arguments.
* \param ret The return value handle.
* \param resource_handle The handle additional resouce handle from fron-end.
* \return 0 if success, -1 if failure happens, set error via TVMAPISetLastError.
extern int TVMWasmPackedCFunc(TVMValue* args, int* type_codes, int num_args, TVMRetValueHandle ret,
void* resource_handle);
* \brief Wasm frontend resource finalizer.
* \param resource_handle The pointer to the external resource.
extern void TVMWasmPackedCFuncFinalizer(void* resource_handle);
} // extern "C"
// Allocate a buffer of at least `size` bytes, backed by an int64_t array so
// that the storage is suitably aligned for 64-bit values.
//
// size: requested size in bytes; it is rounded up to a whole number of
//       8-byte words. A size of 0 yields a valid, zero-length allocation.
// Returns the allocated buffer, or nullptr when `size` is negative. The
// buffer must be released with `delete[]` on an int64_t pointer, which is
// what TVMWasmFreeSpace does.
void* TVMWasmAllocSpace(int size) {
  // A negative byte count cannot be satisfied; report it as a null result
  // instead of handing a negative length to operator new[].
  if (size < 0) {
    return nullptr;
  }
  // Round up in an unsigned type so that `size + 7` cannot overflow `int`.
  const size_t num_words = (static_cast<size_t>(size) + 7) / 8;
  return new int64_t[num_words];
}

// Release a buffer by viewing it as an int64_t array and applying delete[].
// Passing a null pointer is a no-op, as with any delete[] expression.
void TVMWasmFreeSpace(void* arr) {
  int64_t* words = static_cast<int64_t*>(arr);
  delete[] words;
}

int TVMWasmFuncCreateFromCFunc(void* resource_handle, TVMFunctionHandle* out) {
return TVMFuncCreateFromCFunc(TVMWasmPackedCFunc, resource_handle, TVMWasmPackedCFuncFinalizer,
namespace tvm {
namespace runtime {
// A special local session that can interact with async
// functions in the JS runtime.
class AsyncLocalSession : public LocalSession {
AsyncLocalSession() {}
PackedFuncHandle GetFunction(const std::string& name) final {
if (name == "runtime.RPCTimeEvaluator") {
return get_time_eval_placeholder_.get();
} else if (auto* fp = tvm::runtime::Registry::Get(name)) {
// return raw handle because the remote need to explicitly manage it.
return new PackedFunc(*fp);
} else if (auto* fp = tvm::runtime::Registry::Get("__async." + name)) {
auto* rptr = new PackedFunc(*fp);
return rptr;
} else {
return nullptr;
void FreeHandle(void* handle, int type_code) final {
if (type_code == kTVMPackedFuncHandle) {
auto it = async_func_set_.find(handle);
if (it != async_func_set_.end()) {
if (handle != get_time_eval_placeholder_.get()) {
LocalSession::FreeHandle(handle, type_code);
void AsyncCallFunc(PackedFuncHandle func, const TVMValue* arg_values, const int* arg_type_codes,
int num_args, FAsyncCallback callback) final {
auto it = async_func_set_.find(func);
if (it != async_func_set_.end()) {
PackedFunc packed_callback([callback, this](TVMArgs args, TVMRetValue*) {
int code = args[0];
TVMRetValue rv;
rv = args[1];
[&](TVMArgs encoded_args) { callback(RPCCode::kReturn, encoded_args); });
TVMRetValue temp;
std::vector<TVMValue> values(arg_values, arg_values + num_args);
std::vector<int> type_codes(arg_type_codes, arg_type_codes + num_args);
TVMArgsSetter setter(&values[0], &type_codes[0]);
// pass the callback as the last argument.
setter(num_args, packed_callback);
auto* pf = static_cast<PackedFunc*>(func);
pf->CallPacked(TVMArgs(,, num_args + 1), &temp);
} else if (func == get_time_eval_placeholder_.get()) {
// special handle time evaluator.
try {
TVMArgs args(arg_values, arg_type_codes, num_args);
PackedFunc retfunc =
this->GetTimeEvaluator(args[0], args[1], args[2], args[3], args[4], args[5], args[6]);
TVMRetValue rv;
rv = retfunc;
this->EncodeReturn(std::move(rv), [&](TVMArgs encoded_args) {
// mark as async.
callback(RPCCode::kReturn, encoded_args);
} catch (const std::runtime_error& e) {
this->SendException(callback, e.what());
} else {
LocalSession::AsyncCallFunc(func, arg_values, arg_type_codes, num_args, callback);
void AsyncCopyToRemote(void* local_from, size_t local_from_offset, void* remote_to,
size_t remote_to_offset, size_t nbytes, TVMContext remote_ctx_to,
DLDataType type_hint, FAsyncCallback on_complete) final {
TVMContext cpu_ctx;
cpu_ctx.device_type = kDLCPU;
cpu_ctx.device_id = 0;
try {
->CopyDataFromTo(local_from, local_from_offset, remote_to, remote_to_offset, nbytes,
cpu_ctx, remote_ctx_to, type_hint, nullptr);
this->AsyncStreamWait(remote_ctx_to, nullptr, on_complete);
} catch (const std::runtime_error& e) {
this->SendException(on_complete, e.what());
void AsyncCopyFromRemote(void* remote_from, size_t remote_from_offset, void* local_to,
size_t local_to_offset, size_t nbytes, TVMContext remote_ctx_from,
DLDataType type_hint, FAsyncCallback on_complete) final {
TVMContext cpu_ctx;
cpu_ctx.device_type = kDLCPU;
cpu_ctx.device_id = 0;
try {
->CopyDataFromTo(remote_from, remote_from_offset, local_to, local_to_offset, nbytes,
remote_ctx_from, cpu_ctx, type_hint, nullptr);
this->AsyncStreamWait(remote_ctx_from, nullptr, on_complete);
} catch (const std::runtime_error& e) {
this->SendException(on_complete, e.what());
void AsyncStreamWait(TVMContext ctx, TVMStreamHandle stream, FAsyncCallback on_complete) final {
if (ctx.device_type == kDLCPU) {
TVMValue value;
int32_t tcode = kTVMNullptr;
value.v_handle = nullptr;
on_complete(RPCCode::kReturn, TVMArgs(&value, &tcode, 1));
} else {
CHECK(ctx.device_type == static_cast<DLDeviceType>(kDLWebGPU));
if (async_wait_ == nullptr) {
async_wait_ = tvm::runtime::Registry::Get("__async.wasm.WebGPUWaitForTasks");
CHECK(async_wait_ != nullptr);
PackedFunc packed_callback([on_complete](TVMArgs args, TVMRetValue*) {
int code = args[0];
TVMArgs(args.values + 1, args.type_codes + 1, args.size() - 1));
bool IsAsync() const final { return true; }
std::unordered_set<void*> async_func_set_;
std::unique_ptr<PackedFunc> get_time_eval_placeholder_ = std::make_unique<PackedFunc>();
const PackedFunc* async_wait_{nullptr};
// time evaluator
PackedFunc GetTimeEvaluator(Optional<Module> opt_mod, std::string name, int device_type,
int device_id, int number, int repeat, int min_repeat_ms) {
TVMContext ctx;
ctx.device_type = static_cast<DLDeviceType>(device_type);
ctx.device_id = device_id;
if (opt_mod.defined()) {
Module m = opt_mod.value();
std::string tkey = m->type_key();
return WrapWasmTimeEvaluator(m.GetFunction(name, false), ctx, number, repeat, min_repeat_ms);
} else {
auto* pf = runtime::Registry::Get(name);
CHECK(pf != nullptr) << "Cannot find " << name << " in the global function";
return WrapWasmTimeEvaluator(*pf, ctx, number, repeat, min_repeat_ms);
// time evaluator
PackedFunc WrapWasmTimeEvaluator(PackedFunc pf, TVMContext ctx, int number, int repeat,
int min_repeat_ms) {
auto ftimer = [pf, ctx, number, repeat, min_repeat_ms](TVMArgs args, TVMRetValue* rv) {
// the function is a async function.
PackedFunc on_complete = args[args.size() - 1];
// keep argument alive in finvoke so that they
// can be used throughout the async benchmark
std::vector<TVMValue> values(args.values, args.values + args.size() - 1);
std::vector<int> type_codes(args.type_codes, args.type_codes + args.size() - 1);
auto finvoke = [pf, values, type_codes](int n) {
TVMRetValue temp;
TVMArgs invoke_args(,, values.size());
for (int i = 0; i < n; ++i) {
pf.CallPacked(invoke_args, &temp);
auto* time_exec = runtime::Registry::Get("__async.wasm.TimeExecution");
CHECK(time_exec != nullptr) << "Cannot find wasm.GetTimer in the global function";
(*time_exec)(TypedPackedFunc<void(int)>(finvoke), ctx, number, repeat, min_repeat_ms,
return PackedFunc(ftimer);
TVM_REGISTER_GLOBAL("wasm.LocalSession").set_body_typed([]() {
return CreateRPCSessionModule(std::make_shared<AsyncLocalSession>());
} // namespace runtime
} // namespace tvm