softmax.h
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements. See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership. The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License. You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

/*!
 * \file topi/nn/softmax.h
 * \brief Softmax op constructions
 */
#ifndef TVM_TOPI_NN_SOFTMAX_H_
#define TVM_TOPI_NN_SOFTMAX_H_

#include <tvm/te/operation.h>
#include <tvm/topi/reduction.h>
#include <tvm/topi/tags.h>

#include <algorithm>
#include <string>

namespace tvm {
namespace topi {
namespace nn {

using namespace tvm::te;

/*!
 * \brief Softmax activation
 *
 * \param x The input tensor. Can be any dimension
 * \param axis The channel axis along which softmax is performed
 * \param name The name of the operation
 * \param tag The tag to mark the operation
 *
 * \return A Tensor whose op member is the softmax operation
 */
inline Tensor softmax(const Tensor& x, int axis = -1, std::string name = "tensor",
                      std::string tag = "softmax_output") {
  auto input_shape = x->shape;
  auto ndim = input_shape.size();
  if (axis < 0) {
    axis = ndim + axis;
  }
  ICHECK_LT(axis, ndim) << "axis parameter should be less than input dim";

  auto k1 = tvm::te::reduce_axis(Range(0, input_shape[axis]), "k1");
  auto k2 = tvm::te::reduce_axis(Range(0, input_shape[axis]), "k2");
  auto reduced_shape = MakeReduceTargetShape({axis}, x, false, false);
  tvm::Map<String, ObjectRef> attrs;
  attrs.Set("axis", Integer(axis));

  auto insert_reduce_index = [axis, ndim](const Array<Var>& indices, const IterVar& reduce_index) {
    Array<PrimExpr> eval_range;
    int arg_counter = 0;
    for (size_t i = 0; i < ndim; ++i) {
      if (static_cast<int>(i) == axis)
        eval_range.push_back(reduce_index);
      else
        eval_range.push_back(indices[arg_counter++]);
    }
    return eval_range;
  };
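
  // For illustration: with ndim = 3 and axis = 1, reduced-shape indices
  // (i, j) expand to the eval range (i, k, j); the reduction variable is
  // spliced in at the softmax axis.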

  auto get_non_reduce_indices = [axis, ndim](const Array<Var>& indices) {
    Array<PrimExpr> non_reduce_indices;
    for (size_t i = 0; i < ndim; ++i) {
      if (static_cast<int>(i) != axis) non_reduce_indices.push_back(indices[i]);
    }
    return non_reduce_indices;
  };
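
  // The stages below implement the numerically stable formulation
  //   softmax(x)_i = exp(x_i - max(x)) / sum_j exp(x_j - max(x)),
  // which equals exp(x_i) / sum_j exp(x_j) but avoids overflow in exp
  // for large inputs.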

  auto _compute_max = [&](const Array<Var>& indices) {
    auto eval_range = insert_reduce_index(indices, k1);
    return topi::MaxOp(x(eval_range), {k1});
  };

  auto _compute_exp = [&](const Tensor& max_elem, const Array<Var>& indices) {
    auto non_reduce_indices = get_non_reduce_indices(indices);
    return tvm::exp(x(indices) - max_elem(non_reduce_indices));
  };

  auto _compute_expsum = [&](const Tensor& exp, const Array<Var>& indices) {
    auto eval_range = insert_reduce_index(indices, k2);
    return tvm::sum(exp(eval_range), {k2});
  };

  auto _normalize = [&](const Tensor& exp, const Tensor& expsum, const Array<Var>& indices) {
    auto non_reduce_indices = get_non_reduce_indices(indices);
    return exp(indices) / expsum(non_reduce_indices);
  };

  auto max_elem = tvm::te::compute(reduced_shape, _compute_max);
  auto exp = tvm::te::compute(
      input_shape, [&](const Array<Var>& indices) { return _compute_exp(max_elem, indices); });
  auto expsum = tvm::te::compute(
      reduced_shape, [&](const Array<Var>& indices) { return _compute_expsum(exp, indices); });
  return tvm::te::compute(
      input_shape, [&](const Array<Var>& indices) { return _normalize(exp, expsum, indices); },
      name, tag, attrs);
}
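
// Usage sketch (illustrative, not part of the original header): given a 2-D
// placeholder X, a softmax stage over the last axis could be built as
//
//   te::Tensor X = te::placeholder({m, n}, DataType::Float(32), "X");
//   te::Tensor Y = topi::nn::softmax(X, /*axis=*/-1);
//
// Y then has the same shape as X, with each row summing to one.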

/*!
 * \brief Log softmax activation
 *
 * \param x The input tensor. 2-D where log softmax is performed along the second dimension
 * \param name The name of the operation
 * \param tag The tag to mark the operation
 *
 * \return A Tensor whose op member is the log softmax operation
 */
inline Tensor log_softmax(const Tensor& x, std::string name = "tensor",
                          std::string tag = "log_softmax_output") {
  ICHECK_EQ(x->shape.size(), 2) << "Log softmax requires 2-D input";

  PrimExpr m = x->shape[0];
  PrimExpr n = x->shape[1];

  auto k = tvm::te::reduce_axis(Range(0, n), "k");
  auto max_elem =
      tvm::te::compute({m}, [&](Var i) { return tvm::max(x(i, k), Array<IterVar>{k}); });
  k = tvm::te::reduce_axis(Range(0, n), "k");

  auto expsum =
      tvm::te::compute({m}, [&](Var i) { return tvm::sum(tvm::exp(x(i, k) - max_elem(i)), {k}); });

  return tvm::te::compute(
      x->shape, [&](Var i, Var j) { return x(i, j) - max_elem(i) - tvm::log(expsum(i)); }, name,
      tag);
}
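
// Note: this computes x - max(x) - log(sum(exp(x - max(x)))), the numerically
// stable form of log(softmax(x)); unlike softmax above, it only accepts 2-D
// input and always reduces along the second dimension.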

}  // namespace nn
}  // namespace topi
}  // namespace tvm
#endif  // TVM_TOPI_NN_SOFTMAX_H_
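
A minimal end-to-end sketch of driving this header from C++ (assuming a TVM
build with the te and topi headers on the include path; the variable names
and main() scaffolding below are illustrative, not part of softmax.h):

#include <tvm/te/operation.h>
#include <tvm/te/schedule.h>
#include <tvm/topi/nn/softmax.h>

int main() {
  using namespace tvm;
  // Symbolic 2-D input of shape (m, n).
  auto m = te::var("m");
  auto n = te::var("n");
  te::Tensor X = te::placeholder({m, n}, DataType::Float(32), "X");
  // Softmax along the last axis; log_softmax requires exactly this 2-D shape.
  te::Tensor Y = topi::nn::softmax(X, /*axis=*/-1);
  te::Tensor Z = topi::nn::log_softmax(X);
  // Build a default schedule over the resulting ops.
  te::Schedule s = te::create_schedule({Y->op, Z->op});
  return 0;
}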