api/doxygen/cuda__ipc__memory_8h_source.html

 /*

  * Licensed to the Apache Software Foundation (ASF) under one

  * or more contributor license agreements.  See the NOTICE file

  * distributed with this work for additional information

  * regarding copyright ownership.  The ASF licenses this file

  * to you under the Apache License, Version 2.0 (the

  * "License"); you may not use this file except in compliance

  * with the License.  You may obtain a copy of the License at

  *

  *   http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing,

  * software distributed under the License is distributed on an

  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY

  * KIND, either express or implied.  See the License for the

  * specific language governing permissions and limitations

  * under the License.

  */


 #ifndef TVM_RUNTIME_DISCO_CUDA_IPC_MEMORY_H_

 #define TVM_RUNTIME_DISCO_CUDA_IPC_MEMORY_H_


 #include <tvm/runtime/c_runtime_api.h>

 #include <tvm/runtime/memory/memory_manager.h>

 #include <tvm/runtime/object.h>


 #include <vector>


 namespace tvm {

 namespace runtime {

 namespace cuda_ipc {


 /*!
  * \brief The CUDA IPC (interprocess communication) memory object.
  *
  * Holds, for one worker, the per-worker data pointers used as all-reduce
  * inputs together with the barrier signal pointers and flag used to
  * synchronize all-reduce on this buffer.
  *
  * NOTE(review): the int fields below have no default member initializers;
  * presumably the code that creates the object fills them in -- confirm.
  */
 class CUDAIPCMemoryObj : public Object {

  public:

   /*! \brief The number of GPU workers. */
   int num_workers;

   /*! \brief The worker id corresponding to this IPC memory object. */
   int worker_id;

   /*!
    * \brief The data pointers of all all-reduce inputs.
    * It has "num_workers" pointers.
    * NOTE(review): presumably the i-th pointer belongs to worker i -- confirm
    * against the code that fills this vector.
    */
   std::vector<void*> remote_data;


   // We introduce the barrier helper data below per CUDAIPCMemory object
   // so that it can be used by custom collective operations and allow

   // fine-grained synchronization on each buffer. These barriers have

   // low overhead, and can potentially enable concurrent execution of

   // kernels in the future.

   /*!
    * \brief The pointers to input barrier signals of all workers for all-reduce.
    * It has "num_workers" pointers.
    */
   std::vector<void*> barrier_in;

   /*!
    * \brief The pointers to output barrier signals of all workers for all-reduce.
    * It has "num_workers" pointers.
    */
   std::vector<void*> barrier_out;

   /*! \brief The integer buffer flag for all-reduce. */
   int barrier_flag;


   /*! \brief Type key string consumed by TVM_DECLARE_BASE_OBJECT_INFO below. */
   static constexpr const char* _type_key = "tvm.runtime.disco.cuda_ipc_memory";

   /*! \brief Declares that this type has no structural-equality reduce method. */
   static constexpr const bool _type_has_method_sequal_reduce = false;

   /*! \brief Declares that this type has no structural-hash reduce method. */
   static constexpr const bool _type_has_method_shash_reduce = false;

   // Declares the object type info for this class with Object as its parent.
   TVM_DECLARE_BASE_OBJECT_INFO(CUDAIPCMemoryObj, Object);

 };


 /*!
  * \brief Managed reference to CUDAIPCMemoryObj.
  */
 class CUDAIPCMemory : public ObjectRef {

  public:

   /*!
    * \brief Get the global singleton CUDAIPCMemory allocator.
    * \return Pointer to the allocator.
    */
   TVM_DLL static memory::Allocator* GlobalAllocator();

   /*!
    * \brief Given a local CUDA data pointer, return the CUDAIPCMemory object
    * of the pointer.
    * \param ptr The local CUDA data pointer to look up.
    * \return The CUDAIPCMemory object of the pointer.
    * NOTE(review): behavior for a pointer that has no associated
    * CUDAIPCMemory object is not visible in this header -- confirm in the
    * implementation.
    */
   TVM_DLL static CUDAIPCMemory GetIPCMemoryFromDevicePtr(void* ptr);


   // Defines the reference methods, with CUDAIPCMemoryObj as the container type.
   TVM_DEFINE_MUTABLE_OBJECT_REF_METHODS(CUDAIPCMemory, ObjectRef, CUDAIPCMemoryObj);

 };


 }  // namespace cuda_ipc

 }  // namespace runtime

 }  // namespace tvm


 #endif  // TVM_RUNTIME_DISCO_CUDA_IPC_MEMORY_H_

c_runtime_api.h

tvm::runtime::ObjectRef
Base class of all object references.
Definition: object.h:520

tvm::runtime::Object
Base class of all object containers.
Definition: object.h:172

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj
The CUDA IPC (interprocess communication) memory object, which internally contains data pointers to C...
Definition: cuda_ipc_memory.h:41

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::_type_has_method_shash_reduce
static constexpr const bool _type_has_method_shash_reduce
Definition: cuda_ipc_memory.h:75

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::_type_has_method_sequal_reduce
static constexpr const bool _type_has_method_sequal_reduce
Definition: cuda_ipc_memory.h:74

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::_type_key
static constexpr const char * _type_key
Definition: cuda_ipc_memory.h:73

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::barrier_out
std::vector< void * > barrier_out
The pointers to output barrier signals of all workers for all-reduce. It has "num_workers" pointers,...
Definition: cuda_ipc_memory.h:69

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::barrier_in
std::vector< void * > barrier_in
The pointers to input barrier signals of all workers for all-reduce. It has "num_workers" pointers,...
Definition: cuda_ipc_memory.h:64

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::barrier_flag
int barrier_flag
The integer buffer flag for all-reduce.
Definition: cuda_ipc_memory.h:71

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::num_workers
int num_workers
The number of GPU workers.
Definition: cuda_ipc_memory.h:44

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::worker_id
int worker_id
The worker id corresponding to this IPC memory object.
Definition: cuda_ipc_memory.h:46

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::TVM_DECLARE_BASE_OBJECT_INFO
TVM_DECLARE_BASE_OBJECT_INFO(CUDAIPCMemoryObj, Object)

tvm::runtime::cuda_ipc::CUDAIPCMemoryObj::remote_data
std::vector< void * > remote_data
The data pointers of all all-reduce inputs. It has "num_workers" pointers. The i-th pointer is the da...
Definition: cuda_ipc_memory.h:53

tvm::runtime::cuda_ipc::CUDAIPCMemory
Managed reference to CUDAIPCMemoryObj.
Definition: cuda_ipc_memory.h:83

tvm::runtime::cuda_ipc::CUDAIPCMemory::GlobalAllocator
static memory::Allocator * GlobalAllocator()
Get the global singleton CUDAIPCMemory allocator.

tvm::runtime::cuda_ipc::CUDAIPCMemory::TVM_DEFINE_MUTABLE_OBJECT_REF_METHODS
TVM_DEFINE_MUTABLE_OBJECT_REF_METHODS(CUDAIPCMemory, ObjectRef, CUDAIPCMemoryObj)

tvm::runtime::cuda_ipc::CUDAIPCMemory::GetIPCMemoryFromDevicePtr
static CUDAIPCMemory GetIPCMemoryFromDevicePtr(void *ptr)
Given a local CUDA data pointer, return the CUDAIPCMemory object of the pointer.

tvm::runtime::memory::Allocator
Definition: memory_manager.h:58

memory_manager.h
Abstract device memory management API.

tvm
Performance counters for profiling via the PAPI library.
Definition: analyzer.h:36

object.h
A managed object in the TVM runtime.