tvm
All Classes Namespaces Files Functions Variables Typedefs Enumerations Enumerator Friends Macros
layer_norm.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
24 #ifndef TVM_TOPI_NN_LAYER_NORM_H_
25 #define TVM_TOPI_NN_LAYER_NORM_H_
26 
27 #include <tvm/te/operation.h>
28 #include <tvm/topi/tags.h>
29 
30 #include <string>
31 
32 namespace tvm {
33 namespace topi {
34 namespace nn {
35 
36 using namespace tvm::te;
37 
51 inline Tensor layer_norm(const Tensor& data, const Tensor& gamma, const Tensor& beta,
52  const Array<Integer>& axis, double epsilon,
53  std::string name = "T_layer_norm", std::string tag = kInjective) {
54  // sum x and x^2
55  auto ndim = data->shape.size();
56  ICHECK_NE(ndim, 0) << "Cannot reduce a 0 dim Tensor";
57  auto real_axis = GetRealAxis(static_cast<int>(ndim), axis);
58  auto reduce_axes = MakeReduceAxes(real_axis, data);
59  auto target_shape =
60  MakeReduceTargetShape(real_axis, data, /*keepdims=*/false, /*atleast1d=*/true);
61  auto func = MakeTupleSumReducer();
62 
63  auto compute = [ndim, &real_axis, &reduce_axes, &func, &data](const Array<Var>& indices) {
64  Array<PrimExpr> eval_range;
65  int arg_counter = 0;
66  int red_counter = 0;
67 
68  for (size_t i = 0; i < ndim; ++i) {
69  if (std::find(real_axis.begin(), real_axis.end(), i) != real_axis.end()) {
70  // real_axis contains i
71  eval_range.push_back(reduce_axes[red_counter]);
72  red_counter++;
73  } else {
74  eval_range.push_back(indices[arg_counter]);
75  arg_counter++;
76  }
77  }
78  auto square = [](const PrimExpr& x) { return x * x; };
79  return func({data(eval_range), square(data(eval_range))}, reduce_axes, nullptr);
80  };
81 
82  auto temp_x_x2 =
83  tvm::te::compute(target_shape, compute, data->op->name + "_red_temp", kCommReduce);
84 
85  auto temp_x = temp_x_x2[0];
86  auto temp_x2 = temp_x_x2[1];
87 
88  auto reduce_extent = make_const(data->dtype, 1);
89  for (int i : real_axis) {
90  reduce_extent *= data->shape[i];
91  }
92  auto layer_norm_func = [&](const Array<Var>& indices) {
93  Array<Var> reduce_indices, non_reduce_indices;
94  for (int i = 0, n = static_cast<int>(indices.size()); i < n; ++i) {
95  if (std::find(real_axis.begin(), real_axis.end(), i) != real_axis.end()) {
96  reduce_indices.push_back(indices[i]);
97  } else {
98  non_reduce_indices.push_back(indices[i]);
99  }
100  }
101  auto mean = temp_x(non_reduce_indices) / reduce_extent;
102  auto var = temp_x2(non_reduce_indices) / reduce_extent - mean * mean;
103  auto layer_norm = (data(indices) - mean) * tvm::rsqrt(var + make_const(var->dtype, epsilon));
104  layer_norm = topi::multiply(layer_norm, gamma(reduce_indices));
105  if (beta.defined()) {
106  layer_norm = topi::add(layer_norm, beta(reduce_indices));
107  }
108  return layer_norm;
109  };
110  return tvm::te::compute(data->shape, layer_norm_func, name, tag);
111 }
112 
113 } // namespace nn
114 } // namespace topi
115 } // namespace tvm
116 
117 #endif // TVM_TOPI_NN_LAYER_NORM_H_
DataType dtype
The runtime data type of the primitive expression.
Definition: expr.h:101
Reference to PrimExprNode.
Definition: expr.h:114
Array, container representing a contiguous sequence of ObjectRefs.
Definition: array.h:289
void push_back(const T &item)
push a new item to the back of the list
Definition: array.h:457
bool defined() const
Definition: object.h:550
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:102
Tensor expression language DSL.
Definition: extracted_task.h:33
Var var(std::string name_hint, DataType t=DataType::Int(32))
Construct a new Var expression.
Tensor compute(Array< PrimExpr > shape, FCompute fcompute, std::string name="tensor", std::string tag="", Map< String, ObjectRef > attrs={})
Construct a new tensor by computing over shape, using the computation rule: result_tensor[axis] = fco...
PrimExpr make_const(DataType t, ValueType value, Span span=Span())
Make a const value with certain data type.
Definition: op.h:961
Tensor layer_norm(const Tensor &data, const Tensor &gamma, const Tensor &beta, const Array< Integer > &axis, double epsilon, std::string name="T_layer_norm", std::string tag=kInjective)
Layer normalization.
Definition: layer_norm.h:51
FCommReduce MakeTupleSumReducer()
Create commutative reducer summing over tuples.
Definition: reduction.h:587
constexpr auto kInjective
Definition: tags.h:33
tvm::PrimExpr multiply(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:225
constexpr auto kCommReduce
Definition: tags.h:34
Array< IterVar > MakeReduceAxes(const std::vector< int > &real_axis, const Tensor &data)
Enumerate the axes for a reduce op.
Definition: reduction.h:89
std::vector< int > GetRealAxis(int ndim, const Array< Integer > &axis)
Convert a reduction axis which could be empty or have negative elements into a real axis with valid d...
Definition: reduction.h:65
tvm::PrimExpr add(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:197
Array< PrimExpr > MakeReduceTargetShape(const std::vector< int > &real_axis, const Tensor &data, bool keepdims, bool atleast1d)
Calculate the target shape for a reduce op.
Definition: reduction.h:99
runtime implementation for LibTorch/TorchScript.
Definition: analyzer.h:36
PrimExpr rsqrt(PrimExpr x, Span span=Span())
Definition: op.h:712
Operation node can generate one or multiple Tensors.
External function interface to rocBLAS libraries.