24 #ifndef TVM_TOPI_NN_H_
25 #define TVM_TOPI_NN_H_
56 std::string name =
"T_relu", std::string tag =
kElementWise) {
59 [&](
const tvm::ffi::Array<tvm::tirx::Var>& i) {
60 auto threshold_const = tvm::tirx::make_const(t->dtype, threshold);
61 return tvm::max(t(i), threshold_const);
77 std::string name =
"T_leaky_relu",
81 [&](
const tvm::ffi::Array<tvm::tirx::Var>& i) {
83 auto calpha = tvm::tirx::make_const(value.dtype(), alpha);
84 return tvm::tirx::Select(value > 0, value, value * calpha);
101 const int axis = 1, std::string name =
"T_prelu",
103 TVM_FFI_ICHECK((
size_t)axis < x->
shape.size()) <<
"Wrong axis (" << axis <<
")value. ";
104 TVM_FFI_ICHECK(topi::detail::GetConstInt(slope->shape[0]) ==
105 topi::detail::GetConstInt(x->shape[axis]))
106 <<
"Wrong slope shape received.";
110 [&](
const tvm::ffi::Array<tvm::tirx::Var>& indices) {
111 auto xval = x(indices);
112 return tvm::tirx::Select(xval > 0, xval, xval * slope(indices[axis]));
157 const tvm::te::Tensor& t,
const tvm::ffi::Array<tvm::PrimExpr>& pad_before,
158 tvm::ffi::Array<tvm::PrimExpr> pad_after = tvm::ffi::Array<tvm::PrimExpr>(),
160 std::string pad_mode =
"constant",
const ffi::Array<PrimExpr>* dyn_output_shape =
nullptr) {
161 if (pad_after.size() < pad_before.size()) {
162 for (
size_t i = pad_after.size(); i < pad_before.size(); ++i) {
163 pad_after.push_back(pad_before[i]);
168 TVM_FFI_ICHECK_GE(pad_before.size(), 1);
169 TVM_FFI_ICHECK_EQ(pad_before.size(), pad_after.size());
170 tvm::ffi::Array<tvm::PrimExpr> pad_before_int32;
171 tvm::ffi::Array<tvm::PrimExpr> pad_after_int32;
173 for (
const auto& ele : pad_before) {
176 for (
const auto& ele : pad_after) {
180 tvm::ffi::Array<tvm::PrimExpr> output_shape;
181 if (dyn_output_shape ==
nullptr) {
182 for (
size_t i = 0; i < t->shape.size(); ++i) {
183 if (i >= pad_before.size()) {
184 output_shape.push_back(t->shape[i]);
186 output_shape.push_back(
187 analyzer.
Simplify(t->shape[i] + pad_before_int32[i] + pad_after_int32[i]));
191 for (
size_t i = 0; i < dyn_output_shape->size(); i++) {
192 output_shape.push_back((*dyn_output_shape)[i]);
196 if (!pad_value.defined()) {
200 auto l = [&](tvm::ffi::Array<tvm::tirx::Var> ovars) {
201 tvm::ffi::Array<tvm::PrimExpr> indices;
202 tvm::ffi::Array<tvm::PrimExpr> sel;
203 tvm::ffi::Array<tvm::PrimExpr> pad_idx;
204 for (
size_t i = 0; i < t->shape.size(); ++i) {
205 if (i >= pad_before_int32.size()) {
206 indices.push_back(ovars[i]);
209 if (!topi::detail::EqualCheck(pad_before_int32[i], 0)) {
210 sel.push_back(ovars[i] >= pad_before_int32[i]);
211 indices.push_back(ovars[i] - pad_before_int32[i]);
213 indices.push_back(ovars[i]);
215 if (!topi::detail::EqualCheck(pad_after_int32[i], 0)) {
216 sel.push_back(analyzer.
Simplify(ovars[i] < pad_before_int32[i] + t->shape[i]));
218 if (pad_mode ==
"edge") {
222 t->shape[i] - 1, ovars[i] - pad_before[i])));
223 }
else if (pad_mode ==
"reflect") {
227 t->shape[i] * 2 - ovars[i] + pad_before[i] - 2,
228 ovars[i] - pad_before[i])));
231 if (sel.size() != 0) {
232 if (pad_mode ==
"constant") {
236 t(indices), pad_value);
237 }
else if (pad_mode ==
"edge" || pad_mode ==
"reflect") {
241 t(indices), t(pad_idx));
270 int pad_h = 0,
int pad_w = 0,
int stride_h = 1,
int stride_w = 1,
271 std::string name =
"T_conv2d_nchw",
273 TVM_FFI_ICHECK_EQ(4, I->shape.size());
274 TVM_FFI_ICHECK_EQ(4, W->shape.size());
275 auto pH = I->shape[2];
276 auto pW = I->shape[3];
277 tvm::ffi::Array<tvm::PrimExpr> output_shape{
280 indexdiv(I->shape[2] - W->shape[2] + 2 * pad_h, stride_h) + 1,
281 indexdiv(I->shape[3] - W->shape[3] + 2 * pad_w, stride_w) + 1
289 return tvm::sum(T(b, i, stride_h * h + kh, stride_w * w + kw) * W(o, i, kh, kw), {i, kh, kw});
314 int pad_h = 0,
int pad_w = 0,
int stride_h = 1,
int stride_w = 1,
315 std::string name =
"T_conv2d_hwcn",
317 TVM_FFI_ICHECK_EQ(4, I->shape.size());
318 TVM_FFI_ICHECK_EQ(4, W->shape.size());
319 auto pH = I->shape[2];
320 auto pW = I->shape[3];
321 tvm::ffi::Array<tvm::PrimExpr> output_shape{
322 indexdiv(I->shape[2] - W->shape[2] + 2 * pad_h, stride_h) + 1,
323 indexdiv(I->shape[3] - W->shape[3] + 2 * pad_w, stride_w) + 1,
330 auto T = (pad_h == 0 && pad_w == 0) ? I :
pad(I, {pad_h, pad_w});
332 return tvm::sum(T(stride_h * h + kh, stride_w * w + kw, i, b) * W(kh, kw, i, o), {i, kh, kw});
358 int pad_h = 0,
int pad_w = 0,
int stride_h = 1,
360 std::string name =
"T_depthwise_conv2d_nchw",
362 TVM_FFI_ICHECK_EQ(4, I->shape.size());
363 TVM_FFI_ICHECK_EQ(4, W->shape.size());
364 auto pH = I->shape[2];
365 auto pW = I->shape[3];
366 auto pCM = W->shape[1];
367 tvm::ffi::Array<tvm::PrimExpr> output_shape{
370 indexdiv(I->shape[2] - W->shape[2] + 2 * pad_h, stride_h) + 1,
371 indexdiv(I->shape[3] - W->shape[3] + 2 * pad_w, stride_w) + 1
379 return tvm::sum(T(b,
indexdiv(i, pCM), stride_h * h + kh, stride_w * w + kw) *
387 int pad_h = 0,
int pad_w = 0,
int stride_h = 1,
389 std::string name =
"T_depthwise_conv2d_nhwc",
391 TVM_FFI_ICHECK_EQ(4, I->shape.size());
392 TVM_FFI_ICHECK_EQ(4, W->shape.size());
393 auto pH = I->shape[1];
394 auto pW = I->shape[2];
395 auto pCM = W->shape[1];
396 tvm::ffi::Array<tvm::PrimExpr> output_shape{
398 indexdiv(I->shape[1] - W->shape[1] + 2 * pad_h, stride_h) + 1,
399 indexdiv(I->shape[2] - W->shape[2] + 2 * pad_w, stride_w) + 1,
408 return tvm::sum(T(b, stride_h * h + kh, stride_w * w + kw,
indexdiv(i, pCM)) *
436 int pad_h = 0,
int pad_w = 0,
int stride_h = 1,
438 std::string name =
"T_group_conv2d_ngchw",
440 TVM_FFI_ICHECK_EQ(5, I->shape.size());
441 TVM_FFI_ICHECK_EQ(5, W->shape.size());
442 auto pH = I->shape[2];
443 auto pW = I->shape[3];
444 tvm::ffi::Array<tvm::PrimExpr> output_shape{
448 indexdiv(I->shape[3] - W->shape[3] + 2 * pad_h, stride_h) + 1,
449 indexdiv(I->shape[4] - W->shape[4] + 2 * pad_w, stride_w) + 1
455 auto T = (pad_h == 0 && pad_w == 0)
458 auto l = [&](tvm::ffi::Array<tvm::tirx::Var> args) {
464 return tvm::sum(I(b, g, i, stride_h * h + kh, stride_w * w + kw) * W(g, i, o, kh, kw),
484 const tvm::ffi::Array<Integer>& block_shape,
485 const tvm::ffi::Array<tvm::PrimExpr>& pad_before,
486 const tvm::ffi::Array<tvm::PrimExpr>& pad_after,
488 std::string name =
"space_to_batch_nd",
491 TVM_FFI_ICHECK_EQ(pad_before.size(), pad_after.size());
492 TVM_FFI_ICHECK_EQ(block_shape.size(), pad_before.size())
493 <<
"Paddings must be provided for each spatial dimension";
494 tvm::ffi::Array<tvm::PrimExpr> pad_before_int32;
495 tvm::ffi::Array<tvm::PrimExpr> pad_after_int32;
501 for (
const auto& ele : pad_before) {
504 for (
const auto& ele : pad_after) {
509 if (!pad_value.defined()) {
512 padded_t =
pad(data, pad_before_int32, pad_after_int32, pad_value);
514 auto input_shape = data->shape;
515 auto padded_shape = padded_t->shape;
518 tvm::ffi::Array<PrimExpr> r_shape;
519 tvm::ffi::Array<Integer> axis;
520 tvm::ffi::Array<PrimExpr> o_shape;
522 size_t num_block_dims = block_shape.size();
523 int batch =
static_cast<int>(GetConstInt(input_shape[0]));
525 r_shape.push_back(batch);
527 for (
size_t i = 1; i <= num_block_dims; i++) {
528 int padded_input =
static_cast<int>(GetConstInt(padded_shape[i]));
529 int block_size =
static_cast<int>(GetConstInt(block_shape[i - 1]));
530 TVM_FFI_ICHECK_EQ((padded_input % block_size), 0)
533 "Input dimension after padding ("
534 << padded_input <<
")"
535 <<
" must be divisible by its block size (" << block_size <<
")";
537 r_shape.push_back(
div(padded_shape[i], block_shape[i - 1]));
538 r_shape.push_back(block_shape[i - 1]);
539 block_shape_prod *= block_shape[i - 1];
540 axis.push_back(
Integer(r_shape.size() - 1));
543 size_t n = axis.size();
546 for (
size_t i = 0; i < n; i++) {
547 axis.push_back(
static_cast<int>(GetConstInt(axis[i] - 1)));
550 for (
size_t i = 1; i <= num_block_dims; i++) {
551 o_shape.push_back(
div(padded_shape[i], block_shape[i - 1]));
554 for (
size_t i = num_block_dims + 1; i < input_shape.size(); i++) {
555 r_shape.push_back(input_shape[i]);
556 axis.push_back(
Integer(r_shape.size() - 1));
557 o_shape.push_back(input_shape[i]);
562 output =
reshape(output, o_shape);
580 const tvm::ffi::Array<Integer>& block_shape,
581 const tvm::ffi::Array<tvm::PrimExpr>& crop_begin_list,
582 const tvm::ffi::Array<tvm::PrimExpr>& crop_end_list,
583 std::string name =
"batch_to_space_nd",
586 ffi::Array<PrimExpr> in_shape = data->shape;
587 ffi::Array<PrimExpr> r_shape;
588 ffi::Array<Integer> axis;
589 size_t num_block_dims = block_shape.size();
590 size_t num_input_dims = in_shape.size();
592 int batch =
static_cast<int>(GetConstInt(in_shape[0]));
594 for (
size_t i = 0; i < num_block_dims; i++) {
595 r_shape.push_back(block_shape[i]);
596 block_shape_prod *= block_shape[i];
598 axis.push_back(
Integer(r_shape.size()));
599 r_shape.push_back(batch / block_shape_prod);
601 for (
size_t i = 1; i < num_input_dims; i++) {
602 axis.push_back(
Integer(r_shape.size()));
603 if (axis.size() < (num_block_dims + num_input_dims)) {
604 axis.push_back(
Integer(r_shape.size() - (num_block_dims + 1)));
606 r_shape.push_back(in_shape[i]);
609 ffi::Array<PrimExpr> r_p_shape;
610 r_p_shape.push_back(batch / block_shape_prod);
611 for (
size_t i = 1; i <= num_block_dims; i++) {
612 r_p_shape.push_back(in_shape[i] * block_shape[i - 1]);
614 for (
size_t i = num_block_dims + 1; i < num_input_dims; i++) {
615 r_p_shape.push_back(in_shape[i]);
624 ffi::Array<Integer> begin_idx, end_idx, strides;
625 for (
size_t i = 0; i < r_p_shape.size(); ++i) {
627 if (i > 0 && i <= num_block_dims) {
629 int begin_i =
static_cast<int>(GetConstInt(crop_begin_list[i - 1]));
630 int end_i =
static_cast<int>(GetConstInt(crop_end_list[i - 1]));
631 int out_i =
static_cast<int>(GetConstInt(r_p_shape[i]));
632 TVM_FFI_ICHECK_GT(out_i, (begin_i + end_i))
633 <<
"Incorrect crop sizes for (" << i <<
")th dim, can not crop more than"
634 <<
" output size" << out_i <<
" vs " << (begin_i + end_i);
635 begin_idx.push_back(begin_i);
636 end_idx.push_back(out_i - end_i);
639 begin_idx.push_back(
Integer(0));
640 end_idx.push_back(
static_cast<int>(GetConstInt(r_p_shape[i])));
662 std::string reduction =
"mean",
int ignore_index = -100,
663 const std::string name =
"nll_loss",
const std::string tag =
kBroadcast) {
664 if (predictions.ndim() == 1) {
669 [&](
const tvm::ffi::Array<tvm::tirx::Var>& target_indices) {
675 if (reduction ==
"mean") {
678 [&](
const tvm::ffi::Array<tvm::tirx::Var>& target_indices) {
691 [&](
const tvm::ffi::Array<tvm::tirx::Var>& target_indices) {
692 auto c = targets(target_indices);
693 tvm::ffi::Array<tvm::PrimExpr> pred_indices;
694 pred_indices.push_back(target_indices[0]);
695 pred_indices.push_back(c);
696 for (size_t i = 1; i < target_indices.size(); i++) {
697 pred_indices.push_back(target_indices[i]);
699 return tvm::tirx::Select(c != ignore_index, -predictions(pred_indices) * weights(c),
703 TVM_FFI_ICHECK(T->shape.size() != 0);
704 if (reduction ==
"mean") {
707 [&](
const tvm::ffi::Array<tvm::tirx::Var>& target_indices) {
708 auto c = targets(target_indices);
709 return tvm::tirx::Select(c != ignore_index, weights(c),
710 tvm::tirx::make_const(predictions->dtype, 0));
714 topi::sum(W, tvm::ffi::Array<Integer>(
nullptr)));
715 }
else if (reduction ==
"sum") {
716 return topi::sum(T, tvm::ffi::Array<Integer>(
nullptr));
Algebraic expression simplifications.
Container of constant int that adds more constructors.
Definition: expr.h:601
Reference to PrimExprNode.
Definition: expr.h:126
Range container
Definition: expr.h:690
Definition: source_map.h:111
Analyzer that contains bunch of sub-analyzers.
Definition: analyzer.h:634
PrimExpr Simplify(const PrimExpr &expr, int steps=2)
Simplify expr.
static DataType Int(int bits, int lanes=1)
Construct an int type.
Definition: data_type.h:278
Managed Tensor. The array is backed by reference counted blocks.
Definition: tensor.h:54
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:100
Managed reference to SelectNode.
Definition: expr.h:514
a named variable in TIR
Definition: var.h:76
Utility functions for handling constants in TVM expressions.
Tensor expression language DSL.
Definition: extracted_task.h:33
IterVar reduce_axis(Range dom, std::string name="rv")
Create a new IterVar for reduction operations.
Tensor compute(ffi::Array< PrimExpr > shape, FCompute fcompute, std::string name="tensor", std::string tag="", ffi::Map< ffi::String, ffi::Any > attrs={})
Construct a new tensor by computing over shape, using the computation rule: result_tensor[axis] = fcompute(axis).
PrimExpr make_const(DataType t, ValueType value, Span span=Span())
Make a const value with certain data type.
Definition: op.h:1007
PrimExpr const_true(int lanes=1, Span span=Span())
Make a constant true expression.
Definition: op.h:830
PrimExpr foldl(FReduce freduce, PrimExpr init_value, const ffi::Array< PrimExpr > &values, Span span=Span())
Left fold.
Definition: op.h:912
constexpr auto kElementWise
Definition: tags.h:32
Tensor reshape(const Tensor &x, ffi::Array< PrimExpr > newshape, std::string name="T_reshape", std::string tag=kInjective)
Reshape a tensor.
Definition: transform.h:330
constexpr auto kBroadcast
Definition: tags.h:36
constexpr auto kInjective
Definition: tags.h:33
tvm::te::Tensor space_to_batch_nd(const tvm::te::Tensor &data, const tvm::ffi::Array< Integer > &block_shape, const tvm::ffi::Array< tvm::PrimExpr > &pad_before, const tvm::ffi::Array< tvm::PrimExpr > &pad_after, PrimExpr pad_value=PrimExpr(), std::string name="space_to_batch_nd", std::string tag=kInjective)
Divide spatial dimensions of the input into a grid of blocks.
Definition: nn.h:483
constexpr auto kConv2dNCHW
Definition: tags.h:38
tvm::te::Tensor prelu(const tvm::te::Tensor &x, const tvm::te::Tensor &slope, const int axis=1, std::string name="T_prelu", std::string tag=kBroadcast)
Creates an operation that performs a parametric rectified linear unit.
Definition: nn.h:100
tvm::te::Tensor batch_to_space_nd(const tvm::te::Tensor &data, const tvm::ffi::Array< Integer > &block_shape, const tvm::ffi::Array< tvm::PrimExpr > &crop_begin_list, const tvm::ffi::Array< tvm::PrimExpr > &crop_end_list, std::string name="batch_to_space_nd", std::string tag=kInjective)
Reshape the batch dimension into spatial dimensions.
Definition: nn.h:579
tvm::te::Tensor group_conv2d_ngchw(const tvm::te::Tensor &I, const tvm::te::Tensor &W, int pad_h=0, int pad_w=0, int stride_h=1, int stride_w=1, std::string name="T_group_conv2d_ngchw", std::string tag=kGroupConv2d)
Creates an operation that performs a 2-D group convolution with an NGCHW-layout.
Definition: nn.h:435
tvm::te::Tensor leaky_relu(const tvm::te::Tensor &t, double alpha=0.1, std::string name="T_leaky_relu", std::string tag=kElementWise)
Creates an operation that performs a leaky rectified linear unit.
Definition: nn.h:76
tvm::PrimExpr divide(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:241
Tensor transpose(const Tensor &x, ffi::Optional< ffi::Array< Integer >> opt_axes, std::string name="T_transpose", std::string tag=kInjective)
Permute the dimensions of an array.
Definition: transform.h:205
constexpr auto kDepthwiseConv2dNCHW
Definition: tags.h:40
tvm::te::Tensor depthwise_conv2d_nchw(const tvm::te::Tensor &I, const tvm::te::Tensor &W, int pad_h=0, int pad_w=0, int stride_h=1, int stride_w=1, std::string name="T_depthwise_conv2d_nchw", std::string tag=kDepthwiseConv2dNCHW)
Creates an operation that performs a 2-D depthwise convolution with an NCHW-layout.
Definition: nn.h:357
constexpr auto kGroupConv2d
Definition: tags.h:45
tvm::te::Tensor pad(const tvm::te::Tensor &t, const tvm::ffi::Array< tvm::PrimExpr > &pad_before, tvm::ffi::Array< tvm::PrimExpr > pad_after=tvm::ffi::Array< tvm::PrimExpr >(), PrimExpr pad_value=PrimExpr(), std::string name="T_pad", std::string tag=kElementWise, std::string pad_mode="constant", const ffi::Array< PrimExpr > *dyn_output_shape=nullptr)
Creates an operation that performs padding.
Definition: nn.h:156
constexpr auto kConv2dHWCN
Definition: tags.h:39
constexpr auto kDepthwiseConv2dNHWC
Definition: tags.h:41
Tensor strided_slice(const Tensor &x, const ffi::Array< Integer > &begin, const ffi::Array< Integer > &end, const ffi::Array< Integer > &strides, std::string slice_mode="end", std::string name="T_strided_slice", std::string tag=kInjective)
strided_slice of a tensor
Definition: transform.h:962
tvm::te::Tensor conv2d_nchw(const tvm::te::Tensor &I, const tvm::te::Tensor &W, int pad_h=0, int pad_w=0, int stride_h=1, int stride_w=1, std::string name="T_conv2d_nchw", std::string tag=kConv2dNCHW)
Creates an operation that performs a 2-D convolution with an NCHW-layout.
Definition: nn.h:269
Tensor sum(const Tensor &data, const ffi::Optional< ffi::Array< Integer >> &axis, bool keepdims=false, bool atleast1d=false)
Creates an operation that sums array elements over a given axis.
Definition: reduction.h:328
tvm::te::Tensor conv2d_hwcn(const tvm::te::Tensor &I, const tvm::te::Tensor &W, int pad_h=0, int pad_w=0, int stride_h=1, int stride_w=1, std::string name="T_conv2d_hwcn", std::string tag=kConv2dHWCN)
Creates an operation for a 2-D convolution layer with an HWCN-layout.
Definition: nn.h:313
tvm::te::Tensor relu(const tvm::te::Tensor &t, T threshold=static_cast< T >(0), std::string name="T_relu", std::string tag=kElementWise)
Creates an operation that performs a rectified linear unit.
Definition: nn.h:55
Tensor nll_loss(const Tensor &predictions, const Tensor &targets, const Tensor &weights, std::string reduction="mean", int ignore_index=-100, const std::string name="nll_loss", const std::string tag=kBroadcast)
Negative log likelihood loss.
Definition: nn.h:661
Tensor shape(const Tensor &src, DataType dtype, const std::string name="T_shape", const std::string tag=kInjective)
Get the shape of input tensor.
Definition: transform.h:1981
tvm::te::Tensor depthwise_conv2d_nhwc(const tvm::te::Tensor &I, const tvm::te::Tensor &W, int pad_h=0, int pad_w=0, int stride_h=1, int stride_w=1, std::string name="T_depthwise_conv2d_nhwc", std::string tag=kDepthwiseConv2dNHWC)
Definition: nn.h:386
An object that builds and maintains block scope and StmtSref mapping for dependence analysis.
Definition: analyzer.h:37
PrimExpr div(PrimExpr a, PrimExpr b, Span span=Span())
compute division in C semantics.
PrimExpr logical_and(PrimExpr a, PrimExpr b, Span span=Span())
logical and of two expressions
PrimExpr if_then_else(PrimExpr cond, PrimExpr true_value, PrimExpr false_value, Span span=Span())
Conditional expression.
PrimExpr cast(const DataType &t, PrimExpr value, Span span=Span())
cast value to type.
PrimExpr indexdiv(PrimExpr a, PrimExpr b, Span span=Span())
compute floor(a / b) where a and b are non-negative.
PrimExpr sum(PrimExpr source, ffi::Array< tirx::IterVar > axis, ffi::Array< PrimExpr > init={}, Span span=Span())
sum of source expression over axis
PrimExpr indexmod(PrimExpr a, PrimExpr b, Span span=Span())
compute the remainder of floor division, i.e. a - floor(a / b) * b, where a and b are non-negative.
Operation node can generate one or multiple Tensors.
Reduction op constructors.
Common operators defined for Expr.