blob: a0da7fea1eb530975bcb716d5e38a26712f7c413 [file]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
/*!
* \file cuda_fallback_module.cc
* \brief CUDAFallbackModuleNode — codegen-time placeholder used when the CUDA
* runtime is not linked. Mirrors `CUDAModuleNode`'s save/load format
* byte-for-byte; see the NOTE in `SaveToBytes` below, which explains why the
* dependency between the two files is one-way.
* Always compiled (independent of USE_CUDA); never registered as an
* FFI factory or loader.
*/
#include "cuda_fallback_module.h"
#include <tvm/ffi/extra/module.h>
#include <tvm/ffi/function.h>
#include <string>
#include <utility>
#include "../../support/bytes_io.h"
namespace tvm {
namespace target {
/*!
 * \brief Placeholder module that carries CUDA codegen output when the CUDA
 *        runtime is not linked into the build.
 *
 * The node stores the generated payload, its format tag and the function
 * information table so the artifact can be serialized and its source
 * inspected. It cannot launch anything: GetFunction always throws.
 */
class CUDAFallbackModuleNode : public ffi::ModuleObj {
 public:
  /*!
   * \brief Take ownership of the codegen results.
   * \param code Payload produced by codegen.
   * \param fmt Format tag describing \p code.
   * \param fmap Function information table.
   * \param source Format-to-source map, consulted only by InspectSource.
   */
  CUDAFallbackModuleNode(ffi::Bytes code, ffi::String fmt,
                         ffi::Map<ffi::String, runtime::FunctionInfo> fmap,
                         ffi::Map<ffi::String, ffi::String> source)
      : code_(std::move(code)),
        fmt_(std::move(fmt)),
        fmap_(std::move(fmap)),
        source_(std::move(source)) {}

  /*!
   * \brief Report the same kind string as the real CUDA module.
   *
   * Using the identical kind means consumers cannot tell the two apart at the
   * kind/api layer, and the saved bytes load back as a real CUDAModuleNode on
   * a CUDA-equipped receiver.
   */
  const char* kind() const final {
    return "cuda";
  }

  /*! \brief The only advertised capability is binary serialization. */
  int GetPropertyMask() const final {
    return ffi::Module::kBinarySerializable;
  }

  /*!
   * \brief Unsupported: there is no CUDA runtime available to launch kernels.
   * \param name Requested function name (not consulted).
   * \throws RuntimeError unconditionally.
   */
  ffi::Optional<ffi::Function> GetFunction(const ffi::String& name) final {
    TVM_FFI_THROW(RuntimeError)
        << "CUDA runtime is not linked into this build; cannot launch kernels. "
        << "Re-link with USE_CUDA=ON or load this module in a CUDA-equipped "
        << "environment via tvm.runtime.load_module.";
    TVM_FFI_UNREACHABLE();
  }

  /*!
   * \brief Serialize the module as: format tag, function table, payload.
   * \return The serialized bytes. The in-memory source map is not included.
   */
  ffi::Bytes SaveToBytes() const final {
    // NOTE: the byte layout written here MUST stay identical to
    // CUDAModuleNode::SaveToBytes in src/runtime/cuda/cuda_module.cc, which
    // is the source of truth. Both emit a kind="cuda" artifact consumed by
    // the loader ffi.Module.load_from_bytes.cuda (registered only when
    // USE_CUDA=ON). Whenever the real implementation changes its format,
    // apply the same change here. The dependency is one-way: this file
    // tracks cuda_module.cc, and cuda_module.cc never refers to this file.
    std::string serialized;
    support::BytesOutStream writer(&serialized);
    writer.Write(fmt_);
    writer.Write(fmap_);
    writer.Write(code_);
    return ffi::Bytes(std::move(serialized));
  }

  /*!
   * \brief Look up a textual view of the module for the requested format.
   *
   * Resolution order:
   *  1. \p format equals the payload's own format tag -> the payload itself.
   *  2. \p format is a key of the source map -> that entry.
   *  3. \p format is empty -> the "cuda" source-map entry if present,
   *     otherwise the payload when its format tag is "ptx" or "cuda".
   *  4. Anything else -> an empty string.
   *
   * \param format Requested format; may be empty.
   * \return The matching source text, or an empty string when nothing matches.
   */
  ffi::String InspectSource(const ffi::String& format) const final {
    if (format == fmt_) {
      return CodeAsString();
    }

    auto exact_entry = source_.find(format);
    if (exact_entry != source_.end()) {
      return (*exact_entry).second;
    }

    // Only an empty request is eligible for the default fallbacks below.
    if (!format.empty()) {
      return ffi::String();
    }

    auto cuda_entry = source_.find("cuda");
    if (cuda_entry != source_.end()) {
      return (*cuda_entry).second;
    }

    const bool payload_is_default_source = (fmt_ == "ptx" || fmt_ == "cuda");
    return payload_is_default_source ? CodeAsString() : ffi::String();
  }

 private:
  /*! \brief Copy the raw payload bytes into an ffi::String. */
  ffi::String CodeAsString() const {
    return ffi::String(code_.data(), code_.size());
  }

  /*! \brief Codegen output as-is (raw CUDA source, PTX, cubin, fatbin). */
  ffi::Bytes code_;
  /*! \brief Format tag of code_ ("cuda", "ptx", "cubin", "fatbin"). */
  ffi::String fmt_;
  /*! \brief Function information table. */
  ffi::Map<ffi::String, runtime::FunctionInfo> fmap_;
  /*! \brief In-memory source map used by InspectSource; never serialized. */
  ffi::Map<ffi::String, ffi::String> source_;
};
/*!
 * \brief Construct a CUDAFallbackModuleNode and hand it back as an ffi::Module.
 * \param code Payload produced by codegen.
 * \param fmt Format tag describing \p code.
 * \param fmap Function information table.
 * \param source Format-to-source map kept in memory for source inspection.
 * \return A module handle referring to the newly allocated fallback node.
 */
ffi::Module CUDAFallbackModuleCreate(ffi::Bytes code, ffi::String fmt,
                                     ffi::Map<ffi::String, runtime::FunctionInfo> fmap,
                                     ffi::Map<ffi::String, ffi::String> source) {
  // All four arguments are forwarded by move into the node's constructor.
  ffi::ObjectPtr<CUDAFallbackModuleNode> fallback_node =
      ffi::make_object<CUDAFallbackModuleNode>(std::move(code), std::move(fmt), std::move(fmap),
                                               std::move(source));
  return ffi::Module(fallback_node);
}
} // namespace target
} // namespace tvm