api/doxygen/cublas_8h_source.html

 /*

  * Licensed to the Apache Software Foundation (ASF) under one

  * or more contributor license agreements.  See the NOTICE file

  * distributed with this work for additional information

  * regarding copyright ownership.  The ASF licenses this file

  * to you under the Apache License, Version 2.0 (the

  * "License"); you may not use this file except in compliance

  * with the License.  You may obtain a copy of the License at

  *

  *   http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing,

  * software distributed under the License is distributed on an

  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY

  * KIND, either express or implied.  See the License for the

  * specific language governing permissions and limitations

  * under the License.

  */


 #ifndef TVM_TOPI_CONTRIB_CUBLAS_H_

 #define TVM_TOPI_CONTRIB_CUBLAS_H_


 #include <tvm/te/operation.h>

 #include <tvm/topi/detail/extern.h>


 namespace tvm {

 namespace topi {

 namespace contrib {


 using namespace tvm::te;

 using namespace topi::detail;

 inline Tensor cublas_matmul(const Tensor& lhs, const Tensor& rhs, bool transa, bool transb) {

   auto n = transa ? lhs->shape[1] : lhs->shape[0];

   auto m = transb ? rhs->shape[0] : rhs->shape[1];


   return make_extern(

       {{n, m}}, {lhs->dtype}, {lhs, rhs},

       [&](Array<Buffer> ins, Array<Buffer> outs) {

         return call_packed({StringImm("tvm.contrib.cublas.matmul"), pack_buffer(ins[0]),

                             pack_buffer(ins[1]), pack_buffer(outs[0]), transa, transb});

       },

       "C", "", {})[0];

 }


 inline Tensor cublas_batch_matmul(const Tensor& lhs, const Tensor& rhs, bool transa, bool transb) {

   auto b = lhs->shape[0];

   auto n = transa ? lhs->shape[2] : lhs->shape[1];

   auto m = transb ? rhs->shape[1] : rhs->shape[2];


   return make_extern(

       {{b, n, m}}, {lhs->dtype}, {lhs, rhs},

       [&](Array<Buffer> ins, Array<Buffer> outs) {

         return call_packed({StringImm("tvm.contrib.cublas.batch_matmul"), pack_buffer(ins[0]),

                             pack_buffer(ins[1]), pack_buffer(outs[0]), transa, transb});

       },

       "C", "", {})[0];

 }


 }  // namespace contrib

 }  // namespace topi

 }  // namespace tvm


 #endif  // TVM_TOPI_CONTRIB_CUBLAS_H_

tvm::runtime::Array
Array, container representing a contiguous sequence of ObjectRefs.
Definition: array.h:289

tvm::te::Tensor
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:102

tvm::tir::StringImm
Managed reference to StringImmNode.
Definition: expr.h:78

extern.h
Helpers for using external functions.

tvm::te
Tensor expression language DSL.
Definition: extracted_task.h:33

tvm::topi::contrib::cublas_matmul
Tensor cublas_matmul(const Tensor &lhs, const Tensor &rhs, bool transa, bool transb)
Create an op that multiplies lhs and rhs with cuBLAS.
Definition: cublas.h:46

tvm::topi::contrib::cublas_batch_matmul
Tensor cublas_batch_matmul(const Tensor &lhs, const Tensor &rhs, bool transa, bool transb)
Create an op that multiplies batch matrices lhs and rhs with cuBLAS.
Definition: cublas.h:70

tvm
Performance counters for profiling via the PAPI library.
Definition: analyzer.h:36

operation.h
Operation node can generate one or multiple Tensors.