24 #ifndef TVM_RUNTIME_TENSOR_H_
25 #define TVM_RUNTIME_TENSOR_H_
27 #include <tvm/ffi/container/shape.h>
28 #include <tvm/ffi/container/tensor.h>
29 #include <tvm/ffi/optional.h>
30 #include <tvm/ffi/string.h>
45 using ffi::GetDataSize;
47 using ffi::IsContiguous;
53 class Tensor :
public tvm::ffi::Tensor {
75 return tvm::ffi::Tensor::FromDLPackVersioned(tensor,
kAllocAlignment,
true);
83 inline void CopyFrom(
const DLTensor* other);
99 inline void CopyTo(DLTensor* other)
const;
117 ffi::Optional<ffi::String> mem_scope = std::nullopt)
const;
123 inline bool Load(dmlc::Stream* stream);
128 inline void Save(dmlc::Stream* stream)
const;
151 uint64_t relative_byte_offset = 0)
const;
161 ffi::Optional<ffi::String> mem_scope = std::nullopt);
168 TVM_DLL
static void CopyFromTo(
const DLTensor* from, DLTensor* to,
178 TVM_DLL
static void CopyToBytes(
const DLTensor* from,
void* to,
size_t nbytes,
187 inline bool SaveDLTensor(dmlc::Stream* strm,
const DLTensor* tensor);
190 ICHECK(data_ !=
nullptr);
195 ICHECK(data_ !=
nullptr);
196 ICHECK(other.data_ !=
nullptr);
197 CopyFromTo(other.get_mutable(), get_mutable());
201 ICHECK(data_ !=
nullptr);
206 ICHECK(data_ !=
nullptr);
207 ICHECK(other.data_ !=
nullptr);
208 CopyFromTo(get_mutable(), other.get_mutable());
217 strm->Write(reserved);
228 cpu_dev.device_type = kDLCPU;
229 cpu_dev.device_id = 0;
230 strm->Write(cpu_dev);
231 strm->Write(tensor->ndim);
232 strm->Write(tensor->dtype);
233 int ndim = tensor->ndim;
234 strm->WriteArray(tensor->shape, ndim);
235 int type_bytes = (tensor->dtype.bits + 7) / 8;
236 int64_t num_elems = 1;
237 for (
int i = 0; i < ndim; ++i) {
238 num_elems *= tensor->shape[i];
240 int64_t data_byte_size = type_bytes * num_elems;
241 strm->Write(data_byte_size);
243 if (DMLC_IO_NO_ENDIAN_SWAP && tensor->device.device_type == kDLCPU &&
244 ffi::IsContiguous(*tensor) && tensor->byte_offset == 0) {
246 strm->Write(tensor->data, data_byte_size);
248 std::vector<uint8_t> bytes(data_byte_size);
250 if (!DMLC_IO_NO_ENDIAN_SWAP) {
251 dmlc::ByteSwap(dmlc::BeginPtr(bytes), type_bytes, num_elems);
253 strm->Write(dmlc::BeginPtr(bytes), data_byte_size);
261 uint64_t header, reserved;
262 ICHECK(strm->Read(&header)) <<
"Invalid DLTensor file format";
263 ICHECK(strm->Read(&reserved)) <<
"Invalid DLTensor file format";
268 ICHECK(strm->Read(&dev)) <<
"Invalid DLTensor file format";
269 ICHECK(strm->Read(&ndim)) <<
"Invalid DLTensor file format";
270 ICHECK(strm->Read(&dtype)) <<
"Invalid DLTensor file format";
271 ICHECK_EQ(dev.device_type, kDLCPU) <<
"Invalid DLTensor device: can only save as CPU tensor";
272 std::vector<int64_t>
shape(ndim);
274 ICHECK(strm->ReadArray(&
shape[0], ndim)) <<
"Invalid DLTensor file format";
277 int64_t num_elems = 1;
279 for (
int i = 0; i <
ret->ndim; ++i) {
280 num_elems *=
ret->shape[i];
282 int64_t data_byte_size;
283 ICHECK(strm->Read(&data_byte_size)) <<
"Invalid DLTensor file format";
284 ICHECK(data_byte_size == num_elems * elem_bytes) <<
"Invalid DLTensor file format";
285 auto read_ret = strm->Read(
ret->data, data_byte_size);
287 if (ndim > 0 &&
shape[0] != 0) {
288 ICHECK(read_ret) <<
"Invalid DLTensor file format";
290 if (!DMLC_IO_NO_ENDIAN_SWAP) {
291 dmlc::ByteSwap(
ret->data, elem_bytes, num_elems);
304 if (device.device_type == DLDeviceType::kDLCUDA) {
305 return Device{DLDeviceType::kDLCUDAHost, 0};
306 }
else if (device.device_type == DLDeviceType::kDLROCM) {
307 return Device{DLDeviceType::kDLROCMHost, 0};
310 return Device{DLDeviceType::kDLCPU, 0};
320 std::size_t operator()(
const tvm::Device& dev)
const {
321 return ((dev.device_id << 8) | dev.device_type);
328 return (lhs.device_type == rhs.device_type && lhs.device_id == rhs.device_id);
DataType dtype() const
Definition: expr.h:138
Runtime primitive data type.
Definition: data_type.h:47
int bits() const
Definition: data_type.h:115
Managed Tensor. The array is backed by reference counted blocks.
Definition: tensor.h:53
static Tensor FromDLPackVersioned(DLManagedTensorVersioned *tensor)
Definition: tensor.h:74
static Tensor Empty(ffi::Shape shape, DLDataType dtype, Device dev, ffi::Optional< ffi::String > mem_scope=std::nullopt)
Create an empty Tensor.
void CopyFrom(const DLTensor *other)
Copy data content from another array.
Definition: tensor.h:189
Tensor(ffi::UnsafeInit tag)
Definition: tensor.h:62
ffi::Shape Shape() const
Definition: tensor.h:66
void CopyTo(DLTensor *other) const
Copy data content into another array.
Definition: tensor.h:200
void CopyToBytes(void *data, size_t nbytes) const
Copy data content into another array.
Tensor(const ffi::Tensor &other)
Definition: tensor.h:64
Tensor(ffi::Tensor &&other)
Definition: tensor.h:63
runtime::DataType DataType() const
Definition: tensor.h:67
static Tensor FromDLPack(DLManagedTensor *tensor)
Definition: tensor.h:70
void Save(dmlc::Stream *stream) const
Save Tensor to stream.
Definition: tensor.h:258
Tensor(ObjectPtr< ffi::TensorObj > data)
constructor.
Definition: tensor.h:61
Tensor CopyTo(const Device &dev, ffi::Optional< ffi::String > mem_scope=std::nullopt) const
Copy the data to another device.
bool Load(dmlc::Stream *stream)
Load Tensor from stream.
Definition: tensor.h:260
ffi::TensorObj Container
Definition: tensor.h:55
void CopyFromBytes(const void *data, size_t nbytes)
Copy data content from a byte buffer.
Tensor CreateView(ffi::Shape shape, DLDataType dtype, uint64_t relative_byte_offset=0) const
Create a Tensor that shares the data memory with the current one.
static void CopyToBytes(const DLTensor *from, void *to, size_t nbytes, TVMStreamHandle stream=nullptr)
Function to copy data from one array to a byte buffer.
static void CopyFromTo(const DLTensor *from, DLTensor *to, TVMStreamHandle stream=nullptr)
Function to copy data from one array to another.
Abstract device memory management API.
void * TVMStreamHandle
The stream that is specific to device can be NULL, which indicates the default one.
Definition: device_api.h:37
Device GetPreferredHostDevice(Device device)
Get the preferred host device from the input device.
Definition: tensor.h:303
bool SaveDLTensor(dmlc::Stream *strm, const DLTensor *tensor)
Save a DLTensor to stream.
Definition: tensor.h:214
constexpr int kAllocAlignment
Number of bytes each allocation must align to.
Definition: device_api.h:111
constexpr uint64_t kTVMTensorMagic
Magic number for Tensor file.
Definition: tensor.h:212
Tensor shape(const Tensor &src, DataType dtype, const std::string name="T_shape", const std::string tag=kInjective)
Get the shape of input tensor.
Definition: transform.h:1960
Performance counters for profiling via the PAPI library.
Definition: analyzer.h:37
PrimExpr ret(PrimExpr value, Span span=Span())
Return the value.
runtime::DataType DataType
Definition: data_type.h:458
DLDevice Device
Definition: device_api.h:42
A managed object in the TVM runtime.
Serializer extension to support TVM data types Include this file to enable serialization of DLDataTyp...