api/doxygen/instance__norm_8h_source.html

 /*

  * Licensed to the Apache Software Foundation (ASF) under one

  * or more contributor license agreements.  See the NOTICE file

  * distributed with this work for additional information

  * regarding copyright ownership.  The ASF licenses this file

  * to you under the Apache License, Version 2.0 (the

  * "License"); you may not use this file except in compliance

  * with the License.  You may obtain a copy of the License at

  *

  *   http://www.apache.org/licenses/LICENSE-2.0

  *

  * Unless required by applicable law or agreed to in writing,

  * software distributed under the License is distributed on an

  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY

  * KIND, either express or implied.  See the License for the

  * specific language governing permissions and limitations

  * under the License.

  */


 #ifndef TVM_TOPI_NN_INSTANCE_NORM_H_

 #define TVM_TOPI_NN_INSTANCE_NORM_H_


 #include <tvm/te/operation.h>

 #include <tvm/topi/tags.h>


 #include <string>


 namespace tvm {

 namespace topi {

 namespace nn {


 using namespace tvm::te;


 /*!
  * \brief Instance normalization.
  *
  * Sums x and x^2 over the reduction axes in one tuple reduction, derives the mean and the
  * variance (E[x^2] - E[x]^2) from those sums, and computes
  * (data - mean) * rsqrt(var + epsilon), optionally scaled by gamma and shifted by beta.
  * For float16 input the sums, mean and variance are carried in float32 and the normalized
  * value is cast back to float16 before gamma/beta are applied.
  *
  * \param data Input tensor; its dtype must be float32 or float16 and it must not be 0-dim.
  * \param gamma Optional scale tensor, indexed by the channel index only. When defined, its
  *              dtype must equal that of data; when undefined, no scaling is applied.
  * \param beta Optional shift tensor, indexed by the channel index only. When defined, its
  *             dtype must equal that of data; when undefined, no shift is applied.
  * \param channel_axis Position of the channel dimension in data's shape; must be in
  *                     [0, ndim).
  * \param axis Axes to reduce over; resolved to concrete axes through GetRealAxis.
  * \param epsilon Constant added to the variance before the reciprocal square root.
  * \param name Name of the resulting operation.
  * \param tag Tag attached to the resulting operation.
  *
  * \return A tensor with the same shape as data.
  */
 inline Tensor instance_norm(const Tensor& data, const Tensor& gamma, const Tensor& beta,
                             int channel_axis, const ffi::Array<Integer>& axis, double epsilon,
                             std::string name = "T_instance_norm", std::string tag = kInjective) {
   const DataType data_type = data->dtype;
   const DataType gamma_type = gamma.defined() ? gamma->dtype : data_type;
   const DataType beta_type = beta.defined() ? beta->dtype : data_type;
   ICHECK(data_type == gamma_type && data_type == beta_type)
       << "instance_norm: data, gamma and beta must have the same type";
   ICHECK(data_type == DataType::Float(32) || data_type == DataType::Float(16))
       << "instance_norm: only support float32 and float16 for now";
   const bool is_float16 = data_type == DataType::Float(16);
   // float16 inputs are accumulated in float32 to limit rounding error and overflow.
   const DataType acc_type = is_float16 ? DataType::Float(32) : data_type;

   const auto ndim = data->shape.size();
   ICHECK_NE(ndim, 0) << "Cannot reduce a 0 dim Tensor";
   // Fail early with a readable message instead of indexing out of range later on.
   ICHECK(channel_axis >= 0 && static_cast<size_t>(channel_axis) < ndim)
       << "instance_norm: channel_axis " << channel_axis << " is out of range for a " << ndim
       << "-dim tensor";

   // Set up the reduction that sums x and x^2.
   auto real_axis = GetRealAxis(static_cast<int>(ndim), axis);
   auto reduce_axes = MakeReduceAxes(real_axis, data);
   auto target_shape =
       MakeReduceTargetShape(real_axis, data, /*keepdims=*/false, /*atleast1d=*/true);
   auto func = MakeTupleSumReducer();

   // True when dimension `dim` of data is one of the reduced axes.
   auto is_reduce_axis = [&real_axis](int dim) {
     return std::find(real_axis.begin(), real_axis.end(), dim) != real_axis.end();
   };

   auto compute = [ndim, is_float16, &is_reduce_axis, &reduce_axes, &func,
                   &data](const ffi::Array<Var>& indices) {
     // Interleave reduction iterators and output indices to rebuild a full index into data.
     ffi::Array<PrimExpr> eval_range;
     int arg_counter = 0;
     int red_counter = 0;
     for (size_t i = 0; i < ndim; ++i) {
       if (is_reduce_axis(static_cast<int>(i))) {
         eval_range.push_back(reduce_axes[red_counter]);
         red_counter++;
       } else {
         eval_range.push_back(indices[arg_counter]);
         arg_counter++;
       }
     }
     PrimExpr value = data(eval_range);
     if (is_float16) {
       // Widen before squaring so that both sums are formed in float32.
       value = Cast(DataType::Float(32), value);
     }
     return func({value, value * value}, reduce_axes, nullptr);
   };

   auto temp_x_x2 =
       tvm::te::compute(target_shape, compute, data->op->name + "_red_temp", kCommReduce);

   auto temp_x = temp_x_x2[0];
   auto temp_x2 = temp_x_x2[1];

   // Number of reduced elements, built in the accumulator dtype: a float16 constant cannot
   // hold counts above 65504 (e.g. a 256x256 plane), and the sums it divides are float32.
   auto reduce_extent = make_const(acc_type, 1);
   for (int i : real_axis) {
     reduce_extent *= data->shape[i];
   }

   auto instance_norm_func = [&](const ffi::Array<Var>& indices) {
     // The reduced tensors are indexed by the non-reduced output indices only.
     ffi::Array<Var> non_reduce_indices;
     for (int i = 0, n = static_cast<int>(indices.size()); i < n; ++i) {
       if (!is_reduce_axis(i)) {
         non_reduce_indices.push_back(indices[i]);
       }
     }
     const Var channel = indices[channel_axis];
     auto mean = temp_x(non_reduce_indices) / reduce_extent;
     auto var = temp_x2(non_reduce_indices) / reduce_extent - mean * mean;
     auto normalized = (data(indices) - mean) * tvm::rsqrt(var + make_const(var->dtype, epsilon));
     if (is_float16) {
       normalized = Cast(DataType::Float(16), normalized);
     }
     // gamma and beta are both optional (see the dtype checks above); apply each only when
     // it is defined.
     if (gamma.defined()) {
       normalized = topi::multiply(normalized, gamma(channel));
     }
     if (beta.defined()) {
       normalized = topi::add(normalized, beta(channel));
     }
     return normalized;
   };
   return tvm::te::compute(data->shape, instance_norm_func, name, tag);
 }


 }  // namespace nn

 }  // namespace topi

 }  // namespace tvm


 #endif  // TVM_TOPI_NN_INSTANCE_NORM_H_

tvm::PrimExprNode::dtype
DataType dtype
The runtime data type of the primitive expression.
Definition: expr.h:107

tvm::PrimExpr
Reference to PrimExprNode.
Definition: expr.h:124

tvm::runtime::DataType::Float
static DataType Float(int bits, int lanes=1)
Construct a float type.
Definition: data_type.h:294

tvm::te::Tensor
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:100

tvm::tir::Cast
Managed reference to CastNode.
Definition: expr.h:96

tvm::tir::Var
a named variable in TIR
Definition: var.h:77

tvm::te
Tensor expression language DSL.
Definition: extracted_task.h:33

tvm::te::compute
Tensor compute(ffi::Array< PrimExpr > shape, FCompute fcompute, std::string name="tensor", std::string tag="", ffi::Map< ffi::String, ffi::Any > attrs={})
Construct a new tensor by computing over shape, using the computation rule: result_tensor[axis] = fcompute(axis).

tvm::te::var
Var var(std::string name_hint, DataType t=DataType::Int(32))
Construct a new Var expression.

tvm::tir::make_const
PrimExpr make_const(DataType t, ValueType value, Span span=Span())
Make a const value with certain data type.
Definition: op.h:994

tvm::topi::nn::instance_norm
Tensor instance_norm(const Tensor &data, const Tensor &gamma, const Tensor &beta, int channel_axis, const ffi::Array< Integer > &axis, double epsilon, std::string name="T_instance_norm", std::string tag=kInjective)
Instance normalization.
Definition: instance_norm.h:53

tvm::topi::GetRealAxis
std::vector< int > GetRealAxis(int ndim, const ffi::Optional< ffi::Array< Integer >> &axis)
Convert a reduction axis which could be empty or have negative elements into a real axis with valid dimension indices.
Definition: reduction.h:65

tvm::topi::MakeTupleSumReducer
FCommReduce MakeTupleSumReducer()
Create commutative reducer summing over tuples.
Definition: reduction.h:591

tvm::topi::MakeReduceTargetShape
ffi::Array< PrimExpr > MakeReduceTargetShape(const std::vector< int > &real_axis, const Tensor &data, bool keepdims, bool atleast1d)
Calculate the target shape for a reduce op.
Definition: reduction.h:99

tvm::topi::kInjective
constexpr auto kInjective
Definition: tags.h:33

tvm::topi::MakeReduceAxes
ffi::Array< IterVar > MakeReduceAxes(const std::vector< int > &real_axis, const Tensor &data)
Enumerate the axes for a reduce op.
Definition: reduction.h:89

tvm::topi::multiply
tvm::PrimExpr multiply(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:227

tvm::topi::kCommReduce
constexpr auto kCommReduce
Definition: tags.h:34

tvm::topi::add
tvm::PrimExpr add(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:199

tvm
Top-level namespace of the TVM project.
Definition: analyzer.h:37

tvm::rsqrt
PrimExpr rsqrt(PrimExpr x, Span span=Span())
Definition: op.h:745

operation.h
Operation node can generate one or multiple Tensors.

tags.h
Tag definitions for TOPI operators (e.g. kInjective, kCommReduce).