softmax.h
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

/*!
 * \file softmax.h
 * \brief Softmax op constructions
 */
#ifndef TVM_TOPI_NN_SOFTMAX_H_
#define TVM_TOPI_NN_SOFTMAX_H_

#include <tvm/te/operation.h>
#include <tvm/topi/reduction.h>
#include <tvm/topi/tags.h>

#include <algorithm>
#include <string>

namespace tvm {
namespace topi {
namespace nn {

using namespace tvm::te;

/*!
 * \brief Softmax activation.
 *
 * \param x The input tensor. Can have any number of dimensions.
 * \param axis The axis along which softmax is performed.
 * \param name The name of the operation.
 * \param tag The tag to mark the operation.
 *
 * \return A Tensor whose op member is the softmax operation.
 */
inline Tensor softmax(const Tensor& x, int axis = -1, std::string name = "tensor",
                      std::string tag = "softmax_output") {
  auto input_shape = x->shape;
  auto ndim = input_shape.size();
  if (axis < 0) {
    axis = ndim + axis;
  }
  ICHECK_LT(axis, ndim) << "axis parameter should be less than input dim";

  auto k1 = tvm::te::reduce_axis(Range(0, input_shape[axis]), "k1");
  auto k2 = tvm::te::reduce_axis(Range(0, input_shape[axis]), "k2");
  auto reduced_shape = MakeReduceTargetShape({axis}, x, false, false);

  tvm::Map<tvm::String, tvm::ObjectRef> attrs;
  attrs.Set("axis", Integer(axis));

  // Map output indices to input indices, substituting the reduction
  // variable at the softmax axis.
  auto insert_reduce_index = [axis, ndim](const Array<Var>& indices, const IterVar& reduce_index) {
    Array<PrimExpr> eval_range;
    int arg_counter = 0;
    for (size_t i = 0; i < ndim; ++i) {
      if (static_cast<int>(i) == axis) {
        eval_range.push_back(reduce_index);
      } else {
        eval_range.push_back(indices[arg_counter++]);
      }
    }
    return eval_range;
  };

  // Drop the index at the softmax axis, yielding indices into the reduced shape.
  auto get_non_reduce_indices = [axis, ndim](const Array<Var>& indices) {
    Array<PrimExpr> non_reduce_indices;
    for (size_t i = 0; i < ndim; ++i) {
      if (static_cast<int>(i) != axis) non_reduce_indices.push_back(indices[i]);
    }
    return non_reduce_indices;
  };

  // Stage 1: the maximum along the softmax axis, used for numerical stability.
  auto _compute_max = [&](const Array<Var>& indices) {
    auto eval_range = insert_reduce_index(indices, k1);
    return topi::MaxOp(x(eval_range), {k1});
  };

  // Stage 2: exp(x - max), so the largest exponent is exp(0) = 1.
  auto _compute_exp = [&](const Tensor& max_elem, const Array<Var>& indices) {
    auto non_reduce_indices = get_non_reduce_indices(indices);
    return tvm::exp(x(indices) - max_elem(non_reduce_indices));
  };

  // Stage 3: the sum of the exponentials along the softmax axis.
  auto _compute_expsum = [&](const Tensor& exp, const Array<Var>& indices) {
    auto eval_range = insert_reduce_index(indices, k2);
    return tvm::sum(exp(eval_range), {k2});
  };

  // Stage 4: divide each exponential by the sum, producing probabilities.
  auto _normalize = [&](const Tensor& exp, const Tensor& expsum, const Array<Var>& indices) {
    auto non_reduce_indices = get_non_reduce_indices(indices);
    return exp(indices) / expsum(non_reduce_indices);
  };

  auto max_elem = tvm::te::compute(reduced_shape, _compute_max);
  auto exp = tvm::te::compute(
      input_shape, [&](const Array<Var>& indices) { return _compute_exp(max_elem, indices); });
  auto expsum = tvm::te::compute(
      reduced_shape, [&](const Array<Var>& indices) { return _compute_expsum(exp, indices); });
  return tvm::te::compute(
      input_shape, [&](const Array<Var>& indices) { return _normalize(exp, expsum, indices); },
      name, tag, attrs);
}

/*!
 * \brief Log softmax activation.
 *
 * \param x The input tensor. Must be 2-D; log softmax is performed along the second dimension.
 * \param name The name of the operation.
 * \param tag The tag to mark the operation.
 *
 * \return A Tensor whose op member is the log softmax operation.
 */
inline Tensor log_softmax(const Tensor& x, std::string name = "tensor",
                          std::string tag = "log_softmax_output") {
  ICHECK_EQ(x->shape.size(), 2) << "Log softmax requires 2-D input";

  PrimExpr m = x->shape[0];
  PrimExpr n = x->shape[1];

  // Row-wise maximum, for numerical stability.
  auto k = tvm::te::reduce_axis(Range(0, n), "k");
  auto max_elem =
      tvm::te::compute({m}, [&](Var i) { return tvm::max(x(i, k), Array<IterVar>{k}); });
  // A reduction axis can only be consumed once, so create a fresh one for the sum.
  k = tvm::te::reduce_axis(Range(0, n), "k");

  // Row-wise sum of exp(x - max).
  auto expsum =
      tvm::te::compute({m}, [&](Var i) { return tvm::sum(tvm::exp(x(i, k) - max_elem(i)), {k}); });

  // log(softmax(x)) = x - max - log(sum(exp(x - max))).
  return tvm::te::compute(
      x->shape, [&](Var i, Var j) { return x(i, j) - max_elem(i) - tvm::log(expsum(i)); }, name,
      tag);
}

}  // namespace nn
}  // namespace topi
}  // namespace tvm
#endif  // TVM_TOPI_NN_SOFTMAX_H_
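
For reference, a minimal usage sketch of the two ops above. It is not part of the header; the names "logits", "probs", and "log_probs" and the 4x10 shape are illustrative, assuming only a standard TVM build.

#include <tvm/te/operation.h>
#include <tvm/topi/nn/softmax.h>

int main() {
  using namespace tvm;
  // A 2-D input: a batch of 4 rows with 10 classes each.
  te::Tensor logits = te::placeholder({4, 10}, DataType::Float(32), "logits");
  // Softmax over the trailing (class) axis; inputs of any rank are accepted.
  te::Tensor probs = topi::nn::softmax(logits, /*axis=*/-1);
  // log_softmax requires a 2-D input and reduces along the second dimension.
  te::Tensor log_probs = topi::nn::log_softmax(logits);
  // Both results are ordinary te::Tensors that can be scheduled and built
  // like any other tensor-expression output.
  return 0;
}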