api/doxygen/runtime_2tensor_8h_source.html

 /*

  * Licensed to the Apache Software Foundation (ASF) under one

  * or more contributor license agreements.  See the NOTICE file

  * distributed with this work for additional information

  * regarding copyright ownership.  The ASF licenses this file

  * to you under the Apache License, Version 2.0 (the

  * "License"); you may not use this file except in compliance

  * with the License.  You may obtain a copy of the License at

  *

  *   http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing,

  * software distributed under the License is distributed on an

  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY

  * KIND, either express or implied.  See the License for the

  * specific language governing permissions and limitations

  * under the License.

  */


 #ifndef TVM_RUNTIME_TENSOR_H_

 #define TVM_RUNTIME_TENSOR_H_


 #include <tvm/ffi/container/shape.h>

 #include <tvm/ffi/container/tensor.h>

 #include <tvm/ffi/optional.h>

 #include <tvm/ffi/string.h>

 #include <tvm/runtime/base.h>

 #include <tvm/runtime/data_type.h>

 #include <tvm/runtime/device_api.h>

 #include <tvm/runtime/object.h>

 #include <tvm/runtime/serializer.h>


 #include <atomic>

 #include <functional>

 #include <utility>

 #include <vector>


 namespace tvm {

 namespace runtime {


 using ffi::GetDataSize;

 using ffi::IsAligned;

 using ffi::IsContiguous;


 /*!
  * \brief Managed Tensor. The array is backed by reference counted blocks.
  *
  * Thin runtime-level wrapper over tvm::ffi::Tensor that adds copy helpers,
  * stream (de)serialization and a few static factory/copy entry points.
  * Methods marked TVM_DLL are only declared here; their definitions are not
  * part of this header.
  */
 class Tensor : public tvm::ffi::Tensor {

  public:

   /*! \brief The underlying object type managed by this reference. */
   using Container = ffi::TensorObj;

   /*! \brief Default constructor; forwards to the base-class default. */
   Tensor() = default;

   /*!
    * \brief constructor.
    * \param data ObjectPtr to the underlying ffi::TensorObj.
    */
   explicit Tensor(ObjectPtr<ffi::TensorObj> data) : tvm::ffi::Tensor(data) {}

   /*! \brief Constructor forwarding the ffi::UnsafeInit tag to the base class. */
   explicit Tensor(ffi::UnsafeInit tag) : tvm::ffi::Tensor(tag) {}

   /*! \brief Implicit conversion from an rvalue ffi::Tensor (moved into the base). */
   Tensor(ffi::Tensor&& other) : tvm::ffi::Tensor(std::move(other)) {}  // NOLINT(*)

   /*! \brief Implicit conversion from a const ffi::Tensor reference (copied into the base). */
   Tensor(const ffi::Tensor& other) : tvm::ffi::Tensor(other) {}        // NOLINT(*)


   /*! \brief Return the shape of the tensor, as reported by the base-class shape(). */
   ffi::ShapeView Shape() const { return this->shape(); }

   /*! \brief Return the base-class dtype() wrapped as a runtime::DataType. */
   runtime::DataType DataType() const { return runtime::DataType(this->dtype()); }


   // DLPack handling

   /*!
    * \brief Create a Tensor from a DLManagedTensor via ffi::Tensor::FromDLPack.
    * \param tensor The DLPack managed tensor.
    * \note Passes kAllocAlignment and `true` to the ffi call; the meaning of the
    *       trailing flag is defined by ffi::Tensor::FromDLPack
    *       (presumably a contiguity requirement -- TODO confirm).
    */
   static Tensor FromDLPack(DLManagedTensor* tensor) {

     return tvm::ffi::Tensor::FromDLPack(tensor, kAllocAlignment, true);

   }


   /*!
    * \brief Create a Tensor from a DLManagedTensorVersioned via
    *        ffi::Tensor::FromDLPackVersioned.
    * \param tensor The versioned DLPack managed tensor.
    * \note Uses the same kAllocAlignment / `true` arguments as FromDLPack.
    */
   static Tensor FromDLPackVersioned(DLManagedTensorVersioned* tensor) {

     return tvm::ffi::Tensor::FromDLPackVersioned(tensor, kAllocAlignment, true);

   }

   /*! \brief Access the underlying tensor as a const DLTensor pointer (returns get()). */
   inline const DLTensor* operator->() const { return this->get(); }

   /*!
    * \brief Copy data content from another array.
    * \param other The source array to be copied from.
    */
   inline void CopyFrom(const DLTensor* other);

   /*! \brief Copy data content from another Tensor; both tensors must be non-null. */
   inline void CopyFrom(const Tensor& other);

   /*!
    * \brief Copy data content from a byte buffer.
    * \param data The source byte buffer.
    * \param nbytes Number of bytes passed alongside the buffer.
    */
   TVM_DLL void CopyFromBytes(const void* data, size_t nbytes);

   /*!
    * \brief Copy data content into another array.
    * \param other The destination array.
    */
   inline void CopyTo(DLTensor* other) const;

   /*! \brief Copy data content into another Tensor; both tensors must be non-null. */
   inline void CopyTo(const Tensor& other) const;

   /*!
    * \brief Copy data content into a raw buffer.
    * \param data The destination buffer.
    * \param nbytes Number of bytes passed alongside the buffer.
    */
   TVM_DLL void CopyToBytes(void* data, size_t nbytes) const;

   /*!
    * \brief Copy the data to another device.
    * \param dev The target device.
    * \param mem_scope Optional memory scope; defaults to std::nullopt.
    * \return The resulting Tensor.
    */
   TVM_DLL Tensor CopyTo(const Device& dev,

                         ffi::Optional<ffi::String> mem_scope = std::nullopt) const;

   /*!
    * \brief Load Tensor from stream.
    * \param stream The input data stream.
    * \return Whether load is successful.
    */
   inline bool Load(dmlc::Stream* stream);

   /*!
    * \brief Save Tensor to stream.
    * \param stream The output data stream.
    */
   inline void Save(dmlc::Stream* stream) const;


   /*!
    * \brief Create a Tensor that shares the data memory with the current one.
    * \param shape The shape of the new view.
    * \param dtype The data type of the new view.
    * \param relative_byte_offset Byte offset argument, 0 by default
    *        (presumably relative to this tensor's data -- TODO confirm).
    */
   TVM_DLL Tensor CreateView(ffi::Shape shape, DLDataType dtype,

                             uint64_t relative_byte_offset = 0) const;

   /*!
    * \brief Create an empty Tensor.
    * \param shape The shape of the new tensor.
    * \param dtype The data type of the new tensor.
    * \param dev The device of the tensor.
    * \param mem_scope Optional memory scope; defaults to std::nullopt.
    */
   TVM_DLL static Tensor Empty(ffi::Shape shape, DLDataType dtype, Device dev,

                               ffi::Optional<ffi::String> mem_scope = std::nullopt);

   /*!
    * \brief Function to copy data from one array to another.
    * \param from The source array.
    * \param to The target array.
    * \param stream The stream handle; nullptr by default.
    */
   TVM_DLL static void CopyFromTo(const DLTensor* from, DLTensor* to,

                                  TVMStreamHandle stream = nullptr);


   /*!
    * \brief Function to copy data from one array to a byte buffer.
    * \param from The source array.
    * \param to The target byte buffer.
    * \param nbytes Number of bytes passed alongside the buffer.
    * \param stream The stream handle; nullptr by default.
    */
   TVM_DLL static void CopyToBytes(const DLTensor* from, void* to, size_t nbytes,

                                   TVMStreamHandle stream = nullptr);

 };


 /*!
  * \brief Save a DLTensor to stream.
  *
  * Forward declaration only; the inline definition appears further down in
  * this header.
  * \param strm The output stream.
  * \param tensor The tensor to be saved.
  */
 inline bool SaveDLTensor(dmlc::Stream* strm, const DLTensor* tensor);


 inline void Tensor::CopyFrom(const DLTensor* other) {

   ICHECK(data_ != nullptr);

   CopyFromTo(other, get_mutable());

 }


 inline void Tensor::CopyFrom(const Tensor& other) {

   ICHECK(data_ != nullptr);

   ICHECK(other.data_ != nullptr);

   CopyFromTo(other.get_mutable(), get_mutable());

 }


 /*!
  * \brief Copy data content into another array.
  * \param other The destination DLTensor handed to CopyFromTo as the `to` side.
  * \note Fails an ICHECK when this Tensor holds no data.
  */
 inline void Tensor::CopyTo(DLTensor* other) const {
   ICHECK(data_ != nullptr);
   // This tensor is the source of the copy.
   const DLTensor* source = get_mutable();
   Tensor::CopyFromTo(source, other);
 }


 inline void Tensor::CopyTo(const Tensor& other) const {

   ICHECK(data_ != nullptr);

   ICHECK(other.data_ != nullptr);

   CopyFromTo(get_mutable(), other.get_mutable());

 }


 /*!
  * \brief Magic number for Tensor file.
  *
  * Written as the first 64-bit word by SaveDLTensor and compared against the
  * first word read back in Tensor::Load.
  */
 constexpr uint64_t kTVMTensorMagic = 0xDD5E40F096B4A13F;


 /*!
  * \brief Save a DLTensor to stream.
  *
  * Records written, in order: magic number, a reserved 64-bit zero, a CPU
  * device descriptor, ndim, dtype, the shape array, the payload size in bytes
  * and finally the payload itself.
  *
  * \param strm The output stream.
  * \param tensor The tensor to be saved.
  * \return Always true.
  */
 inline bool SaveDLTensor(dmlc::Stream* strm, const DLTensor* tensor) {
   uint64_t magic = kTVMTensorMagic;
   uint64_t reserved_word = 0;
   strm->Write(magic);
   strm->Write(reserved_word);

   // The device stored in the file is always CPU device 0, regardless of where
   // the tensor currently lives. Serialized parameters are meant to be loadable
   // on machines that lack the original accelerator; a caller can move the
   // loaded array afterwards with CopyTo(target_dev).
   Device host_dev;
   host_dev.device_type = kDLCPU;
   host_dev.device_id = 0;
   strm->Write(host_dev);

   strm->Write(tensor->ndim);
   strm->Write(tensor->dtype);
   const int rank = tensor->ndim;
   strm->WriteArray(tensor->shape, rank);

   // NOTE(review): the element size is derived from dtype.bits alone;
   // dtype.lanes is not factored in here -- confirm this is intended.
   const int bytes_per_elem = (tensor->dtype.bits + 7) / 8;
   int64_t elem_count = 1;
   for (int axis = 0; axis < rank; ++axis) {
     elem_count *= tensor->shape[axis];
   }
   const int64_t payload_bytes = bytes_per_elem * elem_count;
   strm->Write(payload_bytes);

   // The tensor memory can be streamed out directly only when no endian swap
   // is needed and the data is a contiguous, zero-offset CPU buffer.
   const bool direct_write = DMLC_IO_NO_ENDIAN_SWAP && tensor->device.device_type == kDLCPU &&
                             ffi::IsContiguous(*tensor) && tensor->byte_offset == 0;
   if (direct_write) {
     strm->Write(tensor->data, payload_bytes);
     return true;
   }

   // Otherwise stage the payload in a temporary byte buffer, swapping byte
   // order when required, and write the staged copy.
   std::vector<uint8_t> staging(payload_bytes);
   Tensor::CopyToBytes(tensor, dmlc::BeginPtr(staging), payload_bytes);
   if (!DMLC_IO_NO_ENDIAN_SWAP) {
     dmlc::ByteSwap(dmlc::BeginPtr(staging), bytes_per_elem, elem_count);
   }
   strm->Write(dmlc::BeginPtr(staging), payload_bytes);
   return true;
 }


 /*!
  * \brief Save Tensor to stream.
  * \param strm The output stream, forwarded to SaveDLTensor.
  * \note The boolean result of SaveDLTensor is discarded.
  */
 inline void Tensor::Save(dmlc::Stream* strm) const {
   const DLTensor* self = operator->();
   SaveDLTensor(strm, self);
 }


 /*!
  * \brief Load Tensor from stream.
  *
  * Reads the layout produced by SaveDLTensor: magic number, reserved word,
  * device, ndim, dtype, shape array, payload byte count and payload. On
  * success the freshly allocated CPU tensor replaces the content of `*this`.
  *
  * Every malformed-input condition fails an ICHECK with
  * "Invalid DLTensor file format" (or the device-specific message).
  *
  * \param strm The input stream.
  * \return Always true when the function returns normally.
  */
 inline bool Tensor::Load(dmlc::Stream* strm) {
   uint64_t header, reserved;
   ICHECK(strm->Read(&header)) << "Invalid DLTensor file format";
   ICHECK(strm->Read(&reserved)) << "Invalid DLTensor file format";
   ICHECK(header == kTVMTensorMagic) << "Invalid DLTensor file format";
   Device dev;
   int ndim;
   DLDataType dtype;
   ICHECK(strm->Read(&dev)) << "Invalid DLTensor file format";
   ICHECK(strm->Read(&ndim)) << "Invalid DLTensor file format";
   ICHECK(strm->Read(&dtype)) << "Invalid DLTensor file format";
   ICHECK_EQ(dev.device_type, kDLCPU) << "Invalid DLTensor device: can only save as CPU tensor";
   // ndim comes straight from the stream; a negative value would otherwise be
   // converted to a huge unsigned size when the shape vector is constructed.
   ICHECK(ndim >= 0) << "Invalid DLTensor file format";
   std::vector<int64_t> shape(ndim);
   if (ndim != 0) {
     ICHECK(strm->ReadArray(&shape[0], ndim)) << "Invalid DLTensor file format";
   }
   Tensor ret = Tensor::Empty(ffi::Shape(shape), dtype, dev);
   int64_t num_elems = 1;
   int elem_bytes = (ret->dtype.bits + 7) / 8;
   for (int i = 0; i < ret->ndim; ++i) {
     num_elems *= ret->shape[i];
   }
   int64_t data_byte_size;
   ICHECK(strm->Read(&data_byte_size)) << "Invalid DLTensor file format";
   ICHECK(data_byte_size == num_elems * elem_bytes) << "Invalid DLTensor file format";
   // Stream::Read reports how many bytes were actually read. Requiring an exact
   // match covers every case uniformly: empty tensors (0 == 0) pass, while
   // truncated payloads -- including 0-d scalars and partial reads -- are
   // rejected.
   const auto read_ret = strm->Read(ret->data, data_byte_size);
   ICHECK(read_ret == static_cast<size_t>(data_byte_size)) << "Invalid DLTensor file format";
   if (!DMLC_IO_NO_ENDIAN_SWAP) {
     dmlc::ByteSwap(ret->data, elem_bytes, num_elems);
   }
   *this = ret;
   return true;
 }


 /*!
  * \brief Get the preferred host device from the input device.
  *
  * CUDA maps to CUDAHost and ROCm maps to ROCMHost; every other device type
  * falls back to CPU. The returned device id is always 0.
  *
  * \param device The input device.
  * \return The host-side device to pair with \p device.
  */
 inline Device GetPreferredHostDevice(Device device) {
   switch (device.device_type) {
     case DLDeviceType::kDLCUDA:
       return Device{DLDeviceType::kDLCUDAHost, 0};
     case DLDeviceType::kDLROCM:
       return Device{DLDeviceType::kDLROCMHost, 0};
     default:
       // Fallback to CPU.
       return Device{DLDeviceType::kDLCPU, 0};
   }
 }


 }  // namespace runtime

 }  // namespace tvm


 namespace std {

 /*!
  * \brief Hash support for tvm::Device so it can key unordered containers.
  *
  * Combines the device id (shifted left by 8 bits) with the device type.
  * Both fields are widened to std::size_t before the shift: shifting the
  * signed device_id directly is undefined in C++17 for negative or
  * overflowing values. Results for ordinary non-negative ids are unchanged.
  */
 template <>
 struct hash<tvm::Device> {
   std::size_t operator()(const tvm::Device& dev) const {
     const std::size_t id_bits = static_cast<std::size_t>(dev.device_id);
     const std::size_t type_bits = static_cast<std::size_t>(dev.device_type);
     return (id_bits << 8) | type_bits;
   }
 };


 /*!
  * \brief Equality support for tvm::Device.
  *
  * Two devices compare equal when both device_type and device_id match.
  */
 template <>
 struct equal_to<tvm::Device> {
   bool operator()(const tvm::Device& lhs, const tvm::Device& rhs) const {
     if (lhs.device_type != rhs.device_type) {
       return false;
     }
     return lhs.device_id == rhs.device_id;
   }
 };

 }  // namespace std


 #endif  // TVM_RUNTIME_TENSOR_H_

tvm::PrimExpr::dtype
DataType dtype() const
Definition: expr.h:138

tvm::runtime::DataType
Runtime primitive data type.
Definition: data_type.h:47

tvm::runtime::DataType::bits
int bits() const
Definition: data_type.h:115

tvm::runtime::Tensor
Managed Tensor. The array is backed by reference counted blocks.
Definition: tensor.h:53

tvm::runtime::Tensor::operator->
const DLTensor * operator->() const
Definition: tensor.h:77

tvm::runtime::Tensor::Tensor
Tensor()=default

tvm::runtime::Tensor::FromDLPackVersioned
static Tensor FromDLPackVersioned(DLManagedTensorVersioned *tensor)
Definition: tensor.h:74

tvm::runtime::Tensor::Empty
static Tensor Empty(ffi::Shape shape, DLDataType dtype, Device dev, ffi::Optional< ffi::String > mem_scope=std::nullopt)
Create an empty Tensor.

tvm::runtime::Tensor::CopyFrom
void CopyFrom(const DLTensor *other)
Copy data content from another array.
Definition: tensor.h:190

tvm::runtime::Tensor::Shape
ffi::ShapeView Shape() const
Definition: tensor.h:66

tvm::runtime::Tensor::Tensor
Tensor(ffi::UnsafeInit tag)
Definition: tensor.h:62

tvm::runtime::Tensor::CopyTo
void CopyTo(DLTensor *other) const
Copy data content into another array.
Definition: tensor.h:201

tvm::runtime::Tensor::CopyToBytes
void CopyToBytes(void *data, size_t nbytes) const
Copy data content into another array.

tvm::runtime::Tensor::Tensor
Tensor(const ffi::Tensor &other)
Definition: tensor.h:64

tvm::runtime::Tensor::Tensor
Tensor(ffi::Tensor &&other)
Definition: tensor.h:63

tvm::runtime::Tensor::DataType
runtime::DataType DataType() const
Definition: tensor.h:67

tvm::runtime::Tensor::FromDLPack
static Tensor FromDLPack(DLManagedTensor *tensor)
Definition: tensor.h:70

tvm::runtime::Tensor::Save
void Save(dmlc::Stream *stream) const
Save Tensor to stream.
Definition: tensor.h:259

tvm::runtime::Tensor::Tensor
Tensor(ObjectPtr< ffi::TensorObj > data)
constructor.
Definition: tensor.h:61

tvm::runtime::Tensor::CopyTo
Tensor CopyTo(const Device &dev, ffi::Optional< ffi::String > mem_scope=std::nullopt) const
Copy the data to another device.

tvm::runtime::Tensor::Load
bool Load(dmlc::Stream *stream)
Load Tensor from stream.
Definition: tensor.h:261

tvm::runtime::Tensor::Container
ffi::TensorObj Container
Definition: tensor.h:55

tvm::runtime::Tensor::CopyFromBytes
void CopyFromBytes(const void *data, size_t nbytes)
Copy data content from a byte buffer.

tvm::runtime::Tensor::CreateView
Tensor CreateView(ffi::Shape shape, DLDataType dtype, uint64_t relative_byte_offset=0) const
Create a Tensor that shares the data memory with the current one.

tvm::runtime::Tensor::CopyToBytes
static void CopyToBytes(const DLTensor *from, void *to, size_t nbytes, TVMStreamHandle stream=nullptr)
Function to copy data from one array to a byte buffer.

tvm::runtime::Tensor::CopyFromTo
static void CopyFromTo(const DLTensor *from, DLTensor *to, TVMStreamHandle stream=nullptr)
Function to copy data from one array to another.

data_type.h

device_api.h
Abstract device memory management API.

TVMStreamHandle
void * TVMStreamHandle
The stream that is specific to device can be NULL, which indicates the default one.
Definition: device_api.h:37

tvm::runtime::GetPreferredHostDevice
Device GetPreferredHostDevice(Device device)
Get the preferred host device from the input device.
Definition: tensor.h:304

tvm::runtime::SaveDLTensor
bool SaveDLTensor(dmlc::Stream *strm, const DLTensor *tensor)
Save a DLTensor to stream.
Definition: tensor.h:215

tvm::runtime::kAllocAlignment
constexpr int kAllocAlignment
Number of bytes each allocation must align to.
Definition: device_api.h:111

tvm::runtime::kTVMTensorMagic
constexpr uint64_t kTVMTensorMagic
Magic number for Tensor file.
Definition: tensor.h:213

tvm::topi::shape
Tensor shape(const Tensor &src, DataType dtype, const std::string name="T_shape", const std::string tag=kInjective)
Get the shape of input tensor.
Definition: transform.h:1960

tvm
Performance counters for profiling via the PAPI library.
Definition: analyzer.h:37

tvm::ret
PrimExpr ret(PrimExpr value, Span span=Span())
Return the value.

tvm::DataType
runtime::DataType DataType
Definition: data_type.h:458

tvm::Device
DLDevice Device
Definition: device_api.h:42

object.h
A managed object in the TVM runtime.

base.h

serializer.h
Serializer extension to support TVM data types Include this file to enable serialization of DLDataTyp...