tvm
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros
device_api.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
24 #ifndef TVM_RUNTIME_DEVICE_API_H_
25 #define TVM_RUNTIME_DEVICE_API_H_
26 
28 #include <tvm/runtime/ndarray.h>
30 
31 #include <string>
32 
33 namespace tvm {
34 namespace runtime {
/*! \brief The query type into GetAttr. */
// NOTE(review): only three enumerators are visible in this listing; the symbol index of this
// page references further ones (e.g. kMaxThreadsPerBlock, kDeviceName) -- confirm against the
// real header before relying on this list being complete.
38 enum DeviceAttrKind : int {
39  kExist = 0,
41  kWarpSize = 2,
49  kGcnArch = 10,
56 };
57 
// Allocation alignment constants. When TVM_KALLOC_ALIGNMENT is defined it supplies the value
// of both constants; otherwise both default to 64.
58 #ifdef TVM_KALLOC_ALIGNMENT
/*! \brief Number of bytes each allocation must align to. */
60 constexpr int kAllocAlignment = TVM_KALLOC_ALIGNMENT;
61 
/*! \brief Number of bytes each allocation must align to in temporary allocation. */
63 constexpr int kTempAllocaAlignment = TVM_KALLOC_ALIGNMENT;
64 #else
/*! \brief Number of bytes each allocation must align to. */
66 constexpr int kAllocAlignment = 64;
67 
/*! \brief Number of bytes each allocation must align to in temporary allocation. */
69 constexpr int kTempAllocaAlignment = 64;
70 #endif // TVM_KALLOC_ALIGNMENT
71 
/*! \brief Maximum size that can be allocated on stack. */
73 constexpr int kMaxStackAlloca = 1024;
74 
/*! \brief Number of bytes each allocation must align to by default in the workspace buffer. */
77 constexpr int kDefaultWorkspaceAlignment = 1;
78 
/*!
 * \brief TVM Runtime Device API, abstracts the device specific interface for memory management.
 *
 * NOTE(review): the symbol index of this page also lists CreateStream(Device) and
 * GetCurrentStream(Device) as members; they do not appear in this listing -- confirm against
 * the real header.
 */
83 class TVM_DLL DeviceAPI {
84  public:
    /*! \brief Virtual destructor. */
86  virtual ~DeviceAPI() {}
    /*! \brief Set the environment device id to device. */
91  virtual void SetDevice(Device dev) = 0;
    /*! \brief Get attribute of specified device. */
99  virtual void GetAttr(Device dev, DeviceAttrKind kind, TVMRetValue* rv) = 0;
100 
    /*! \brief Get the physical memory size required. */
107  virtual size_t GetDataSize(const DLTensor& arr, Optional<String> mem_scope = NullOpt);
108 
    /*!
     * \brief Query the device for specified properties.
     * \note The default implementation here has an empty body.
     */
115  virtual void GetTargetProperty(Device dev, const std::string& property, TVMRetValue* rv) {}
116 
    /*! \brief Allocate a data space on device. */
126  virtual void* AllocDataSpace(Device dev, size_t nbytes, size_t alignment,
127  DLDataType type_hint) = 0;
    /*! \brief Allocate a data space on device with memory scope support. */
137  virtual void* AllocDataSpace(Device dev, int ndim, const int64_t* shape, DLDataType dtype,
138  Optional<String> mem_scope = NullOpt);
    /*! \brief Free a data space on device. */
144  virtual void FreeDataSpace(Device dev, void* ptr) = 0;
    /*! \brief Copy data from one place to another. */
155  virtual void CopyDataFromTo(DLTensor* from, DLTensor* to, TVMStreamHandle stream);
162 
    /*! \brief Free a stream of execution. */
169  virtual void FreeStream(Device dev, TVMStreamHandle stream);
170 
    /*! \brief Synchronize the stream. */
176  virtual void StreamSync(Device dev, TVMStreamHandle stream) = 0;
    /*!
     * \brief Set the stream.
     * \note The default implementation here has an empty body.
     */
182  virtual void SetStream(Device dev, TVMStreamHandle stream) {}
    /*! \brief Synchronize 2 streams of execution. */
201  virtual void SyncStreamFromTo(Device dev, TVMStreamHandle event_src, TVMStreamHandle event_dst);
    /*! \brief Allocate temporary workspace for backend execution. */
218  virtual void* AllocWorkspace(Device dev, size_t nbytes, DLDataType type_hint = {});
    /*! \brief Free temporary workspace in backend execution. */
225  virtual void FreeWorkspace(Device dev, void* ptr);
226 
    /*! \brief Get device API based on device. */
233  static DeviceAPI* Get(Device dev, bool allow_missing = false);
234 
    /*!
     * \brief Whether a certain device type requires set device before launching the kernel
     *        function.
     * \return true for every device type other than kDLCPU.
     */
240  static bool NeedSetDevice(int device_type) { return device_type != kDLCPU; }
241 
    /*!
     * \brief Whether pointer arithmetics on a device owned pointer may be performed on the host.
     * \return false in this default implementation.
     */
245  virtual bool SupportsDevicePointerArithmeticsOnHost() { return false; }
246 
247  protected:
    /*! \brief Copy data from one place to another (raw-pointer overload with explicit offsets). */
261  virtual void CopyDataFromTo(const void* from, size_t from_offset, void* to, size_t to_offset,
262  size_t num_bytes, Device dev_from, Device dev_to,
263  DLDataType type_hint, TVMStreamHandle stream);
264 };
265 
/*!
 * \brief Device types at or above this value are treated as RPC session devices
 *        (IsRPCSessionDevice tests device_type / kRPCSessMask > 0).
 */
267 constexpr int kRPCSessMask = 128;
// Compile-time guard: the mask must not be smaller than TVMDeviceExtType_End.
268 static_assert(kRPCSessMask >= TVMDeviceExtType_End);
269 
/*!
 * \brief Return true if a Device is owned by an RPC session.
 * \param dev The device to inspect.
 * \return true when dev.device_type / kRPCSessMask is greater than zero.
 */
273 inline bool IsRPCSessionDevice(Device dev) { return (dev.device_type / kRPCSessMask) > 0; }
274 
/*!
 * \brief Return the RPCSessTable index of the RPC Session that owns this device.
 * \param dev The device; ICHECK fails if IsRPCSessionDevice(dev) is false.
 * \return dev.device_type / kRPCSessMask - 1.
 */
279 inline int GetRPCSessionIndex(Device dev) {
280  ICHECK(IsRPCSessionDevice(dev)) << "GetRPCSessionIndex: dev has no RPC session";
    // AddRPCSessionMask stores (index + 1) * kRPCSessMask, hence the "- 1" here.
281  return dev.device_type / kRPCSessMask - 1;
282 }
283 
292  dev.device_type = static_cast<DLDeviceType>(dev.device_type % kRPCSessMask);
293  return dev;
294 }
295 
296 inline std::ostream& operator<<(std::ostream& os, DLDevice dev) { // NOLINT(*)
298  os << "remote[" << tvm::runtime::GetRPCSessionIndex(dev) << "]-";
300  }
301  os << tvm::runtime::DLDeviceType2Str(static_cast<int>(dev.device_type)) << ":" << dev.device_id;
302  return os;
303 }
304 
/*!
 * \brief Add a RPC session mask to a Device.
 * \param dev The device; CHECK fails if it already satisfies IsRPCSessionDevice.
 * \param session_table_index The session index to encode into the device type.
 * \return A copy of dev whose device_type is OR-ed with
 *         kRPCSessMask * (session_table_index + 1).
 */
312 inline Device AddRPCSessionMask(Device dev, int session_table_index) {
313  CHECK(!IsRPCSessionDevice(dev)) << "AddRPCSessionMask: dev already non-zero RPCSessionIndex: "
314  << dev;
    // The index is stored offset by one so that an encoded index of 0 still sets the mask bit.
315  dev.device_type =
316  static_cast<DLDeviceType>(dev.device_type | (kRPCSessMask * (session_table_index + 1)));
317  return dev;
318 }
319 
320 } // namespace runtime
321 } // namespace tvm
322 
323 #endif // TVM_RUNTIME_DEVICE_API_H_
@ TVMDeviceExtType_End
Definition: c_runtime_api.h:122
void * TVMStreamHandle
The stream that is specific to device can be NULL, which indicates the default one.
Definition: c_runtime_api.h:230
TVM Runtime Device API, abstracts the device specific interface for memory management.
Definition: device_api.h:83
static bool NeedSetDevice(int device_type)
Whether a certain device type requires set device before launching the kernel function.
Definition: device_api.h:240
static DeviceAPI * Get(Device dev, bool allow_missing=false)
Get device API based on device.
virtual void CopyDataFromTo(DLTensor *from, DLTensor *to, TVMStreamHandle stream)
copy data from one place to another
virtual TVMStreamHandle CreateStream(Device dev)
Create a new stream of execution.
virtual void SyncStreamFromTo(Device dev, TVMStreamHandle event_src, TVMStreamHandle event_dst)
Synchronize 2 streams of execution.
virtual void FreeWorkspace(Device dev, void *ptr)
Free temporal workspace in backend execution.
virtual bool SupportsDevicePointerArithmeticsOnHost()
Whether pointer arithmetics on a device owned pointer may be performed on the host.
Definition: device_api.h:245
virtual void * AllocDataSpace(Device dev, int ndim, const int64_t *shape, DLDataType dtype, Optional< String > mem_scope=NullOpt)
Allocate a data space on device with memory scope support.
virtual void SetDevice(Device dev)=0
Set the environment device id to device.
virtual void FreeStream(Device dev, TVMStreamHandle stream)
Free a stream of execution.
virtual TVMStreamHandle GetCurrentStream(Device dev)
Get the current stream.
virtual void GetTargetProperty(Device dev, const std::string &property, TVMRetValue *rv)
Query the device for specified properties.
Definition: device_api.h:115
virtual size_t GetDataSize(const DLTensor &arr, Optional< String > mem_scope=NullOpt)
Get the physical memory size required.
virtual void * AllocWorkspace(Device dev, size_t nbytes, DLDataType type_hint={})
Allocate temporal workspace for backend execution.
virtual void GetAttr(Device dev, DeviceAttrKind kind, TVMRetValue *rv)=0
Get attribute of specified device.
virtual void StreamSync(Device dev, TVMStreamHandle stream)=0
Synchronize the stream.
virtual void FreeDataSpace(Device dev, void *ptr)=0
Free a data space on device.
virtual void CopyDataFromTo(const void *from, size_t from_offset, void *to, size_t to_offset, size_t num_bytes, Device dev_from, Device dev_to, DLDataType type_hint, TVMStreamHandle stream)
copy data from one place to another
virtual void SetStream(Device dev, TVMStreamHandle stream)
Set the stream.
Definition: device_api.h:182
virtual void * AllocDataSpace(Device dev, size_t nbytes, size_t alignment, DLDataType type_hint)=0
Allocate a data space on device.
virtual ~DeviceAPI()
virtual destructor
Definition: device_api.h:86
Optional container that represents a nullable variant of T.
Definition: optional.h:51
Return Value container, Unlike TVMArgValue, which only holds reference and do not delete the underlyi...
Definition: packed_func.h:946
constexpr int kMaxStackAlloca
Maximum size that can be allocated on stack.
Definition: device_api.h:73
DeviceAttrKind
the query type into GetAttr
Definition: device_api.h:38
@ kDeviceName
Definition: device_api.h:44
@ kDriverVersion
Definition: device_api.h:51
@ kMaxThreadsPerBlock
Definition: device_api.h:40
@ kMultiProcessorCount
Definition: device_api.h:46
@ kMaxThreadDimensions
Definition: device_api.h:47
@ kApiVersion
Definition: device_api.h:50
@ kImagePitchAlignment
Definition: device_api.h:55
@ kMaxClockRate
Definition: device_api.h:45
@ kWarpSize
Definition: device_api.h:41
@ kTotalGlobalMemory
Definition: device_api.h:53
@ kAvailableGlobalMemory
Definition: device_api.h:54
@ kMaxRegistersPerBlock
Definition: device_api.h:48
@ kComputeVersion
Definition: device_api.h:43
@ kGcnArch
Definition: device_api.h:49
@ kMaxSharedMemoryPerBlock
Definition: device_api.h:42
@ kExist
Definition: device_api.h:39
@ kL2CacheSizeBytes
Definition: device_api.h:52
constexpr int kRPCSessMask
Device types greater than or equal to this value denote RPC session devices.
Definition: device_api.h:267
constexpr int kDefaultWorkspaceAlignment
Number of bytes each allocation must align to by default in the workspace buffer to service intermedi...
Definition: device_api.h:77
int GetRPCSessionIndex(Device dev)
Return the RPCSessTable index of the RPC Session that owns this device.
Definition: device_api.h:279
constexpr int kTempAllocaAlignment
Number of bytes each allocation must align to in temporary allocation.
Definition: device_api.h:69
bool IsRPCSessionDevice(Device dev)
Return true if a Device is owned by an RPC session.
Definition: device_api.h:273
Device AddRPCSessionMask(Device dev, int session_table_index)
Add a RPC session mask to a Device. RPC clients typically do this when decoding a Device received fro...
Definition: device_api.h:312
constexpr int kAllocAlignment
Number of bytes each allocation must align to.
Definition: device_api.h:66
std::ostream & operator<<(std::ostream &os, const ObjectRef &n)
Definition: repr_printer.h:97
Device RemoveRPCSessionMask(Device dev)
Remove the RPC session mask from a Device. RPC clients typically do this when encoding a Device for t...
Definition: device_api.h:291
constexpr const char * device_type
The device type.
Definition: stmt.h:1422
Tensor shape(const Tensor &src, DataType dtype, const std::string name="T_shape", const std::string tag=kInjective)
Get the shape of input tensor.
Definition: transform.h:1913
Performance counters for profiling via the PAPI library.
Definition: analyzer.h:36
DLDevice Device
Definition: ndarray.h:43
constexpr runtime::NullOptType NullOpt
Definition: optional.h:169
A device-independent managed NDArray abstraction.
Type-erased function used across TVM API.