tvm
elemwise.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
24 #ifndef TVM_TOPI_ELEMWISE_H_
25 #define TVM_TOPI_ELEMWISE_H_
26 
27 #include <tvm/tir/builtin.h>
28 #include <tvm/tir/expr.h>
29 #include <tvm/tir/op.h>
30 #include <tvm/topi/tags.h>
31 
32 #include <algorithm>
33 #include <string>
34 
35 #include "broadcast.h"
36 
37 namespace tvm {
38 namespace topi {
39 
40 using namespace tvm::te;
41 
42 // Unary intrinsic operators
43 #define TOPI_DECLARE_UNARY_OP(OpName) \
44  inline Tensor OpName(const Tensor& x, std::string name = "T_" #OpName, \
45  std::string tag = kElementWise) { \
46  return compute( \
47  x->shape, [&](const Array<Var>& i) { return ::tvm::OpName(x(i)); }, name, tag); \
48  }
49 
77 
82 inline Tensor fast_tanh_float(const Tensor& in, std::string name, std::string tag) {
83  // Clamp the inputs to the range [-9, 9] since anything outside
84  // this range is +/-1.0f in single-precision.
85  auto x = maximum(make_const(in->dtype, -9.0), minimum(make_const(in->dtype, 9.0), in));
86 
87  // The monomial coefficients of the numerator polynomial (odd).
88  auto alpha_1 = make_const(in->dtype, 4.89352455891786e-03);
89  auto alpha_3 = make_const(in->dtype, 6.37261928875436e-04);
90  auto alpha_5 = make_const(in->dtype, 1.48572235717979e-05);
91  auto alpha_7 = make_const(in->dtype, 5.12229709037114e-08);
92  auto alpha_9 = make_const(in->dtype, -8.60467152213735e-11);
93  auto alpha_11 = make_const(in->dtype, 2.00018790482477e-13);
94  auto alpha_13 = make_const(in->dtype, -2.76076847742355e-16);
95 
96  // The monomial coefficients of the denominator polynomial (even).
97  auto beta_0 = make_const(in->dtype, 4.89352518554385e-03);
98  auto beta_2 = make_const(in->dtype, 2.26843463243900e-03);
99  auto beta_4 = make_const(in->dtype, 1.18534705686654e-04);
100  auto beta_6 = make_const(in->dtype, 1.19825839466702e-06);
101 
102  return compute(
103  x->shape,
104  [&](const Array<Var>& i) {
105  auto x2 = x(i) * x(i);
106  auto p = x2 * alpha_13 + alpha_11;
107  p = x2 * p + alpha_9;
108  p = x2 * p + alpha_7;
109  p = x2 * p + alpha_5;
110  p = x2 * p + alpha_3;
111  p = x2 * p + alpha_1;
112  p = x(i) * p;
113 
114  auto q = x2 * beta_6 + beta_4;
115  q = x2 * q + beta_2;
116  q = x2 * q + beta_0;
117  return p / q;
118  },
119  name, tag);
120 }
121 
131 inline Tensor fast_tanh(const Tensor& x, std::string name = "T_fast_tanh",
132  std::string tag = kElementWise) {
133  if (x->dtype == DataType::Float(32)) {
134  // invoke fast_tanh_float implementation
135  return fast_tanh_float(x, name, tag);
136  } else {
137  // fallback to default implementation
138  return compute(
139  x->shape, [&](const Array<Var>& i) { return ::tvm::tanh(x(i)); }, name, tag);
140  }
141 }
142 
152 inline Tensor identity(const Tensor& x, std::string name = "T_identity",
153  std::string tag = kElementWise) {
154  return compute(
155  x->shape, [&](const Array<Var>& i) { return x(i); }, name, tag);
156 }
157 
167 inline Tensor negative(const Tensor& x, std::string name = "T_negative",
168  std::string tag = kElementWise) {
169  return compute(
170  x->shape, [&](const Array<Var>& i) { return -x(i); }, name, tag);
171 }
172 
182 inline Tensor logical_not(const Tensor& x, std::string name = "T_logical_not",
183  std::string tag = kElementWise) {
184  return compute(
185  x->shape, [&](const Array<Var>& i) { return !x(i); }, name, tag);
186 }
187 
197 inline Tensor bitwise_not(const Tensor& x, std::string name = "T_bitwise_not",
198  std::string tag = kElementWise) {
199  return compute(
200  x->shape, [&](const Array<Var>& i) { return ~x(i); }, name, tag);
201 }
202 
212 inline Tensor sign(const Tensor& x, std::string name = "T_sign", std::string tag = kElementWise) {
213  return compute(
214  x->shape,
215  [&](const Array<Var>& i) {
216  PrimExpr zero = make_zero(x->dtype);
217  PrimExpr one = make_const(x->dtype, 1);
218  PrimExpr minus_one = make_const(x->dtype, -1);
219  auto s1 = tvm::tir::Select((x(i) < zero), minus_one, zero);
220  auto s2 = tvm::tir::Select((x(i) > zero), one, s1);
221  return s2;
222  },
223  name, tag);
224 }
225 
235 inline Tensor rsqrt(const Tensor& x, std::string name = "tensor", std::string tag = kElementWise) {
236  return compute(
237  x->shape,
238  [&](const Array<Var>& i) {
239  PrimExpr one = make_const(x->dtype, 1);
240  return one / tvm::sqrt(x(i));
241  },
242  name, tag);
243 }
244 
257 inline Tensor clip(const Tensor& x, const PrimExpr& a_min, const PrimExpr& a_max,
258  std::string name = "T_clip", std::string tag = kElementWise) {
259  return compute(
260  x->shape,
261  [&](const Array<Var>& i) {
262  auto min_val = tvm::cast(x->dtype, a_min);
263  auto max_val = tvm::cast(x->dtype, a_max);
264  return tvm::max(tvm::min(x(i), max_val), min_val); // NOLINT(*)
265  },
266  name, tag);
267 }
268 
281 inline Tensor cast(const Tensor& x, DataType type, std::string name = "T_cast",
282  std::string tag = kElementWise) {
283  return compute(
284  x->shape,
285  [&](const Array<Var>& i) -> PrimExpr {
286  auto expr = x(i);
287  if (expr.dtype().code() == type.code() && expr.dtype().bits() == type.bits()) {
288  if (expr.dtype().lanes() == type.lanes()) {
289  return expr;
290  } else if (expr.dtype().lanes() == 1 && type.is_vector()) {
291  return tvm::tir::Broadcast(expr, type.lanes());
292  }
293  }
294 
295  return tvm::cast(type, x(i));
296  },
297  name, tag);
298 }
299 
310 inline Tensor reinterpret(const Tensor& x, DataType type, std::string name = "tensor",
311  std::string tag = kElementWise) {
312  return compute(
313  x->shape, [&](const Array<Var>& i) { return reinterpret(type, x(i)); }, name, tag);
314 }
315 
325 inline Tensor elemwise_sum(const Array<Tensor>& xs, std::string name = "T_elemwise_sum",
326  std::string tag = kElementWise) {
327  ICHECK_GT(xs.size(), 0) << "elemwise sum must have at least one input tensor.";
328  return compute(
329  xs[0]->shape,
330  [&](const Array<Var>& i) {
331  auto sum_expr = xs[0](i);
332  for (size_t j = 1; j < xs.size(); j++) {
333  sum_expr = sum_expr + xs[j](i);
334  }
335  return sum_expr;
336  },
337  name, tag);
338 }
339 
351 inline Tensor full(const Array<PrimExpr>& shape, DataType dtype, const PrimExpr fill_value,
352  std::string name = "T_full", std::string tag = kElementWise) {
353  PrimExpr ev = cast(dtype, fill_value);
354  if (!ev.defined()) {
355  LOG(ERROR) << "Can't cast fill_value to " << dtype;
356  }
357  return compute(
358  shape, [&](const Array<Var>& i) { return ev; }, name, tag);
359 }
360 
372 inline Tensor full_like(const Tensor& x, const PrimExpr fill_value,
373  std::string name = "T_full_like", std::string tag = kElementWise) {
374  PrimExpr ev = cast(x->dtype, fill_value);
375  return compute(
376  x->shape, [&](const Array<Var>& i) { return ev; }, name, tag);
377 }
378 
400 inline Tensor fast_exp_float32(const Tensor& _x, std::string name, std::string tag) {
401  auto x_hi = make_const(DataType::Float(32), 88.3762626647950f);
402  auto x_lo = make_const(DataType::Float(32), -88.3762626647949f);
403  auto log2e = make_const(DataType::Float(32), 1.44269504088896341f);
404  auto ln2 = make_const(DataType::Float(32), 0.6931471805599453f);
405  PrimExpr p[6] = {make_const(DataType::Float(32), 1.9875691500E-4f),
406  make_const(DataType::Float(32), 1.3981999507E-3f),
407  make_const(DataType::Float(32), 8.3334519073E-3f),
408  make_const(DataType::Float(32), 4.1665795894E-2f),
409  make_const(DataType::Float(32), 1.6666665459E-1f),
410  make_const(DataType::Float(32), 5.0000001201E-1f)};
411  auto one = make_const(DataType::Float(32), 1.0f);
412  auto one_half = make_const(DataType::Float(32), 0.5f);
413  auto b = make_const(DataType::Float(32), 127.0f);
414 
415  return compute(
416  _x->shape,
417  [&](const Array<Var>& i) {
418  // clamp x
419  auto x = ::tvm::max(::tvm::min(_x(i), x_hi), x_lo);
420  // integer part
421  auto n = ::tvm::floor(x * log2e + one_half);
422  // fractional part
423  auto f = x - n * ln2;
424  auto y =
425  (((((p[0] * f + p[1]) * f + p[2]) * f + p[3]) * f + p[4]) * f + p[5]) * f * f + f + one;
426  // Return 2^m * exp(r).
427  auto ef =
428  tvm::reinterpret(DataType::Float(32), ::tvm::cast(DataType::Int(32), n + b) << 23);
429  return ::tvm::max(ef * y, _x(i)); // NOLINT(*)
430  },
431  name, tag);
432 }
433 
444 inline Tensor fast_exp(const Tensor& x, std::string name = "T_fast_exp",
445  std::string tag = kElementWise) {
446  if (x->dtype == DataType::Float(32)) {
447  auto ret = fast_exp_float32(x, name, tag);
448  return ret;
449  } else {
450  return compute(
451  x->shape, [&](const Array<Var>& i) { return ::tvm::exp(x(i)); }, name, tag);
452  }
453 }
454 
458 inline Tensor fast_erf_float32(const Tensor& data, std::string name, std::string tag) {
459  return compute(
460  data->shape, [&](const Array<Var>& i) { return fast_erf_float_expr(data(i), 32); }, name,
461  tag);
462 }
463 
467 inline Tensor fast_erf_float16(const Tensor& data, std::string name, std::string tag) {
468  return compute(
469  data->shape, [&](const Array<Var>& i) { return fast_erf_float_expr(data(i), 16); }, name,
470  tag);
471 }
472 
482 inline Tensor fast_erf(const Tensor& x, std::string name = "T_fast_erf",
483  std::string tag = kElementWise) {
484  if (x->dtype == DataType::Float(32)) {
485  auto ret = fast_erf_float32(x, name, tag);
486  return ret;
487  } else if (x->dtype == DataType::Float(16)) {
488  auto ret = fast_erf_float16(x, name, tag);
489  return ret;
490  } else {
491  return topi::erf(x);
492  }
493 }
494 
495 } // namespace topi
496 } // namespace tvm
497 #endif // TVM_TOPI_ELEMWISE_H_
Reference to PrimExprNode.
Definition: expr.h:115
Array, container representing a contiguous sequence of ObjectRefs.
Definition: array.h:289
size_t size() const
Definition: array.h:420
Runtime primitive data type.
Definition: data_type.h:43
static DataType Float(int bits, int lanes=1)
Construct an float type.
Definition: data_type.h:236
bool defined() const
Definition: object.h:552
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:102
Detail broadcast.
#define TOPI_DECLARE_UNARY_OP(OpName)
Definition: elemwise.h:43
Tensor expression language DSL.
Definition: extracted_task.h:33
Tensor compute(Array< PrimExpr > shape, FCompute fcompute, std::string name="tensor", std::string tag="", Map< String, ObjectRef > attrs={})
Construct a new tensor by computing over shape, using the computation rule: result_tensor[axis] = fco...
PrimExpr make_const(DataType t, ValueType value, Span span=Span())
Make a const value with certain data type.
Definition: op.h:962
constexpr auto kElementWise
Definition: tags.h:32
Tensor clip(const Tensor &x, const PrimExpr &a_min, const PrimExpr &a_max, std::string name="T_clip", std::string tag=kElementWise)
Creates an operation that clips each element of a tensor to the interval [a_min, a_max].
Definition: elemwise.h:257
Tensor ceil(const Tensor &x, std::string name="T_" "ceil", std::string tag=kElementWise)
Definition: elemwise.h:58
Tensor isinf(const Tensor &x, std::string name="T_" "isinf", std::string tag=kElementWise)
Definition: elemwise.h:76
Tensor round(const Tensor &x, std::string name="T_" "round", std::string tag=kElementWise)
Definition: elemwise.h:59
Tensor tan(const Tensor &x, std::string name="T_" "tan", std::string tag=kElementWise)
Definition: elemwise.h:64
Tensor logical_not(const Tensor &x, std::string name="T_logical_not", std::string tag=kElementWise)
Creates an operation that returns the logical NOT of a given tensor.
Definition: elemwise.h:182
Tensor fast_erf_float32(const Tensor &data, std::string name, std::string tag)
Fast_erf_float expression from Eigen.
Definition: elemwise.h:458
Tensor reinterpret(const Tensor &x, DataType type, std::string name="tensor", std::string tag=kElementWise)
Reinterpret each element of x to the given type.
Definition: elemwise.h:310
Tensor floor(const Tensor &x, std::string name="T_" "floor", std::string tag=kElementWise)
Definition: elemwise.h:57
Tensor trunc(const Tensor &x, std::string name="T_" "trunc", std::string tag=kElementWise)
Definition: elemwise.h:60
Tensor isnan(const Tensor &x, std::string name="T_" "isnan", std::string tag=kElementWise)
Definition: elemwise.h:73
Tensor fast_erf_float16(const Tensor &data, std::string name, std::string tag)
Fast_erf_float expression from Eigen for float16.
Definition: elemwise.h:467
Tensor exp(const Tensor &x, std::string name="T_" "exp", std::string tag=kElementWise)
Definition: elemwise.h:50
Tensor acos(const Tensor &x, std::string name="T_" "acos", std::string tag=kElementWise)
Definition: elemwise.h:67
Tensor asinh(const Tensor &x, std::string name="T_" "asinh", std::string tag=kElementWise)
Definition: elemwise.h:70
Tensor log(const Tensor &x, std::string name="T_" "log", std::string tag=kElementWise)
Definition: elemwise.h:54
Tensor fast_tanh_float(const Tensor &in, std::string name, std::string tag)
Fast_tanh_float implementation from Eigen https://github.com/eigenteam/eigen-git-mirror/blob/master/E...
Definition: elemwise.h:82
Tensor full(const Array< PrimExpr > &shape, DataType dtype, const PrimExpr fill_value, std::string name="T_full", std::string tag=kElementWise)
Creates an operation that fill a tensor with fill_value.
Definition: elemwise.h:351
Tensor fast_tanh(const Tensor &x, std::string name="T_fast_tanh", std::string tag=kElementWise)
Creates an operation that returns hyperbolic tanh of a given tensor.
Definition: elemwise.h:131
Tensor fast_erf(const Tensor &x, std::string name="T_fast_erf", std::string tag=kElementWise)
Fast erf implementation.
Definition: elemwise.h:482
Tensor cos(const Tensor &x, std::string name="T_" "cos", std::string tag=kElementWise)
Definition: elemwise.h:62
tvm::PrimExpr minimum(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:354
Tensor cast(const Tensor &x, DataType type, std::string name="T_cast", std::string tag=kElementWise)
Cast each element of x to the given type. If expr is scalar and type is a corresponding vector type,...
Definition: elemwise.h:281
Tensor sqrt(const Tensor &x, std::string name="T_" "sqrt", std::string tag=kElementWise)
Definition: elemwise.h:53
Tensor rsqrt(const Tensor &x, std::string name="tensor", std::string tag=kElementWise)
Creates an operation that returns rsqrt of a given tensor.
Definition: elemwise.h:235
Tensor abs(const Tensor &x, std::string name="T_" "abs", std::string tag=kElementWise)
Definition: elemwise.h:61
Tensor elemwise_sum(const Array< Tensor > &xs, std::string name="T_elemwise_sum", std::string tag=kElementWise)
Creates an operation that sum each element of a tensor.
Definition: elemwise.h:325
Tensor asin(const Tensor &x, std::string name="T_" "asin", std::string tag=kElementWise)
Definition: elemwise.h:69
Tensor bitwise_not(const Tensor &x, std::string name="T_bitwise_not", std::string tag=kElementWise)
Creates an operation that returns the bitwise NOT of a given tensor.
Definition: elemwise.h:197
Tensor atan(const Tensor &x, std::string name="T_" "atan", std::string tag=kElementWise)
Definition: elemwise.h:71
Tensor atanh(const Tensor &x, std::string name="T_" "atanh", std::string tag=kElementWise)
Definition: elemwise.h:72
Tensor log10(const Tensor &x, std::string name="T_" "log10", std::string tag=kElementWise)
Definition: elemwise.h:56
Tensor sigmoid(const Tensor &x, std::string name="T_" "sigmoid", std::string tag=kElementWise)
Definition: elemwise.h:52
Tensor identity(const Tensor &x, std::string name="T_identity", std::string tag=kElementWise)
Creates an operation that returns identity of a given tensor.
Definition: elemwise.h:152
Tensor isfinite(const Tensor &x, std::string name="T_" "isfinite", std::string tag=kElementWise)
Definition: elemwise.h:75
Tensor log2(const Tensor &x, std::string name="T_" "log2", std::string tag=kElementWise)
Definition: elemwise.h:55
Tensor cosh(const Tensor &x, std::string name="T_" "cosh", std::string tag=kElementWise)
Definition: elemwise.h:63
Tensor acosh(const Tensor &x, std::string name="T_" "acosh", std::string tag=kElementWise)
Definition: elemwise.h:68
Tensor sin(const Tensor &x, std::string name="T_" "sin", std::string tag=kElementWise)
Definition: elemwise.h:65
Tensor tanh(const Tensor &x, std::string name="T_" "tanh", std::string tag=kElementWise)
Definition: elemwise.h:74
Tensor full_like(const Tensor &x, const PrimExpr fill_value, std::string name="T_full_like", std::string tag=kElementWise)
Creates an operation that construct a tensor with same shape as input tensor, then fill a tensor with...
Definition: elemwise.h:372
Tensor erf(const Tensor &x, std::string name="T_" "erf", std::string tag=kElementWise)
Definition: elemwise.h:51
Tensor fast_exp(const Tensor &x, std::string name="T_fast_exp", std::string tag=kElementWise)
Fast exponential function implementation.
Definition: elemwise.h:444
Tensor shape(const Tensor &src, DataType dtype, const std::string name="T_shape", const std::string tag=kInjective)
Get the shape of input tensor.
Definition: transform.h:1913
Tensor sign(const Tensor &x, std::string name="T_sign", std::string tag=kElementWise)
Returns the sign of the tensor.
Definition: elemwise.h:212
Tensor negative(const Tensor &x, std::string name="T_negative", std::string tag=kElementWise)
Creates an operation that returns the negation of a given tensor.
Definition: elemwise.h:167
Tensor sinh(const Tensor &x, std::string name="T_" "sinh", std::string tag=kElementWise)
Definition: elemwise.h:66
tvm::PrimExpr maximum(const tvm::PrimExpr &a, const tvm::PrimExpr &b)
Definition: broadcast.h:341
Tensor fast_exp_float32(const Tensor &_x, std::string name, std::string tag)
Fast exponential function implementation.
Definition: elemwise.h:400
runtime implementation for LibTorch/TorchScript.
Definition: analyzer.h:36
PrimExpr ret(PrimExpr value, Span span=Span())
Return the value.
PrimExpr cast(const DataType &t, PrimExpr value, Span span=Span())
cast value to type.
External function interface to rocBLAS libraries.
TIR builtin intrinsics.
TIR expressions.
Common operators defined for Expr.