tvm
vision.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
23 #ifndef TVM_RELAX_ATTRS_VISION_H_
24 #define TVM_RELAX_ATTRS_VISION_H_
25 
26 #include <tvm/ffi/string.h>
27 #include <tvm/ir/attrs.h>
28 #include <tvm/ir/type.h>
29 #include <tvm/relax/expr.h>
30 
31 namespace tvm {
32 namespace relax {
33 
36  : public AttrsNodeReflAdapter<AllClassNonMaximumSuppressionAttrs> {
37  ffi::String output_format;
38 
39  static void RegisterReflection() {
40  namespace refl = tvm::ffi::reflection;
41  refl::ObjectDef<AllClassNonMaximumSuppressionAttrs>().def_ro(
43  "Output format, onnx or tensorflow. Returns outputs in a way that can be easily "
44  "consumed by each frontend.");
45  }
46  TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.AllClassNonMaximumSuppressionAttrs",
48 }; // struct AllClassNonMaximumSuppressionAttrs
49 
51 struct ROIAlignAttrs : public AttrsNodeReflAdapter<ROIAlignAttrs> {
52  ffi::Array<int64_t> pooled_size;
53  double spatial_scale;
55  bool aligned;
56  ffi::String layout;
57  ffi::String mode;
58 
59  static void RegisterReflection() {
60  namespace refl = tvm::ffi::reflection;
61  refl::ObjectDef<ROIAlignAttrs>()
62  .def_ro("pooled_size", &ROIAlignAttrs::pooled_size, "Output size of roi align.")
63  .def_ro("spatial_scale", &ROIAlignAttrs::spatial_scale,
64  "Ratio of input feature map height (or width) to raw image height (or width).")
65  .def_ro("sample_ratio", &ROIAlignAttrs::sample_ratio,
66  "Optional sampling ratio of ROI align, using adaptive size by default.")
67  .def_ro("aligned", &ROIAlignAttrs::aligned,
68  "Whether to use the aligned ROIAlign semantics without the legacy 1-pixel clamp.")
69  .def_ro("layout", &ROIAlignAttrs::layout, "Dimension ordering of the input data.")
70  .def_ro("mode", &ROIAlignAttrs::mode, "Mode for ROI Align. Can be 'avg' or 'max'.");
71  }
73 }; // struct ROIAlignAttrs
74 
76 struct ROIPoolAttrs : public AttrsNodeReflAdapter<ROIPoolAttrs> {
77  ffi::Array<int64_t> pooled_size;
78  double spatial_scale;
79  ffi::String layout;
80 
81  static void RegisterReflection() {
82  namespace refl = tvm::ffi::reflection;
83  refl::ObjectDef<ROIPoolAttrs>()
84  .def_ro("pooled_size", &ROIPoolAttrs::pooled_size, "Output size of roi pool.")
85  .def_ro("spatial_scale", &ROIPoolAttrs::spatial_scale,
86  "Ratio of input feature map height (or width) to raw image height (or width).")
87  .def_ro("layout", &ROIPoolAttrs::layout, "Dimension ordering of the input data.");
88  }
90 }; // struct ROIPoolAttrs
91 
93 struct GetValidCountsAttrs : public AttrsNodeReflAdapter<GetValidCountsAttrs> {
95  int id_index;
97 
98  static void RegisterReflection() {
99  namespace refl = tvm::ffi::reflection;
100  refl::ObjectDef<GetValidCountsAttrs>()
101  .def_ro("score_threshold", &GetValidCountsAttrs::score_threshold,
102  "Lower limit of score for valid bounding boxes.")
103  .def_ro("id_index", &GetValidCountsAttrs::id_index,
104  "Index of the class categories, -1 to disable.")
105  .def_ro("score_index", &GetValidCountsAttrs::score_index,
106  "Index of the scores/confidence of boxes.");
107  }
108  TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.GetValidCountsAttrs", GetValidCountsAttrs,
109  BaseAttrsNode);
110 }; // struct GetValidCountsAttrs
111 
113 struct NonMaximumSuppressionAttrs : public AttrsNodeReflAdapter<NonMaximumSuppressionAttrs> {
117  int top_k;
120  int id_index;
125 
126  static void RegisterReflection() {
127  namespace refl = tvm::ffi::reflection;
128  refl::ObjectDef<NonMaximumSuppressionAttrs>()
129  .def_ro("max_output_size", &NonMaximumSuppressionAttrs::max_output_size,
130  "Max number of output valid boxes, -1 for no limit.")
131  .def_ro("iou_threshold", &NonMaximumSuppressionAttrs::iou_threshold,
132  "Non-maximum suppression IoU threshold.")
133  .def_ro("force_suppress", &NonMaximumSuppressionAttrs::force_suppress,
134  "Whether to suppress all detections regardless of class_id.")
135  .def_ro("top_k", &NonMaximumSuppressionAttrs::top_k,
136  "Keep maximum top k detections before nms, -1 for no limit.")
137  .def_ro("coord_start", &NonMaximumSuppressionAttrs::coord_start,
138  "Start index of the consecutive 4 coordinates.")
139  .def_ro("score_index", &NonMaximumSuppressionAttrs::score_index,
140  "Index of the scores/confidence of boxes.")
141  .def_ro("id_index", &NonMaximumSuppressionAttrs::id_index,
142  "Index of the class categories, -1 to disable.")
143  .def_ro("return_indices", &NonMaximumSuppressionAttrs::return_indices,
144  "Whether to return box indices in input data.")
145  .def_ro("invalid_to_bottom", &NonMaximumSuppressionAttrs::invalid_to_bottom,
146  "Whether to move all valid bounding boxes to the top.")
147  .def_ro("soft_nms_sigma", &NonMaximumSuppressionAttrs::soft_nms_sigma,
148  "Sigma for soft-NMS; 0.0 means standard hard NMS.")
149  .def_ro("score_threshold", &NonMaximumSuppressionAttrs::score_threshold,
150  "Score threshold for soft-NMS validity check; 0.0 when unused.");
151  }
152  TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.NonMaximumSuppressionAttrs",
154 }; // struct NonMaximumSuppressionAttrs
155 
157 struct MultiboxTransformLocAttrs : public AttrsNodeReflAdapter<MultiboxTransformLocAttrs> {
158  bool clip;
159  double threshold;
160  ffi::Array<double> variances;
162 
163  static void RegisterReflection() {
164  namespace refl = tvm::ffi::reflection;
165  refl::ObjectDef<MultiboxTransformLocAttrs>()
166  .def_ro("clip", &MultiboxTransformLocAttrs::clip,
167  "Clip decoded ymin,xmin,ymax,xmax to [0,1].")
168  .def_ro("threshold", &MultiboxTransformLocAttrs::threshold,
169  "After softmax, zero scores strictly below this value.")
170  .def_ro("variances", &MultiboxTransformLocAttrs::variances,
171  "(x,y,w,h) scales = TFLite 1/x_scale,1/y_scale,1/w_scale,1/h_scale on "
172  "encodings. Very large w/h scales can overflow exp in decode.")
173  .def_ro("keep_background", &MultiboxTransformLocAttrs::keep_background,
174  "If false, force output scores[:,0,:] to 0 (background class).");
175  }
176  TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.MultiboxTransformLocAttrs",
178 }; // struct MultiboxTransformLocAttrs
179 
180 } // namespace relax
181 } // namespace tvm
182 
183 #endif // TVM_RELAX_ATTRS_VISION_H_
Helpers for attribute objects.
Adapter for AttrsNode with the new reflection API.
Definition: attrs.h:391
Base class of all attribute class.
Definition: attrs.h:102
IR/AST nodes for the unified type system in TVM.
An object that builds and maintains block scope and StmtSref mapping for Dependence analysis.
Definition: analyzer.h:37
Attributes used in AllClassNonMaximumSuppression operator.
Definition: vision.h:36
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.AllClassNonMaximumSuppressionAttrs", AllClassNonMaximumSuppressionAttrs, BaseAttrsNode)
static void RegisterReflection()
Definition: vision.h:39
ffi::String output_format
Definition: vision.h:37
Attributes used in GetValidCounts operator.
Definition: vision.h:93
int id_index
Definition: vision.h:95
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.GetValidCountsAttrs", GetValidCountsAttrs, BaseAttrsNode)
static void RegisterReflection()
Definition: vision.h:98
int score_index
Definition: vision.h:96
double score_threshold
Definition: vision.h:94
Attributes for multibox_transform_loc (SSD / TFLite-style box decode).
Definition: vision.h:157
static void RegisterReflection()
Definition: vision.h:163
bool clip
Definition: vision.h:158
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.MultiboxTransformLocAttrs", MultiboxTransformLocAttrs, BaseAttrsNode)
ffi::Array< double > variances
Definition: vision.h:160
double threshold
Definition: vision.h:159
bool keep_background
Definition: vision.h:161
Attributes used in NonMaximumSuppression operator.
Definition: vision.h:113
bool return_indices
Definition: vision.h:121
bool force_suppress
Definition: vision.h:116
int score_index
Definition: vision.h:119
double iou_threshold
Definition: vision.h:115
int top_k
Definition: vision.h:117
double soft_nms_sigma
Definition: vision.h:123
int id_index
Definition: vision.h:120
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.NonMaximumSuppressionAttrs", NonMaximumSuppressionAttrs, BaseAttrsNode)
static void RegisterReflection()
Definition: vision.h:126
int max_output_size
Definition: vision.h:114
bool invalid_to_bottom
Definition: vision.h:122
int coord_start
Definition: vision.h:118
double score_threshold
Definition: vision.h:124
Attributes used in ROIAlign operator.
Definition: vision.h:51
static void RegisterReflection()
Definition: vision.h:59
ffi::String layout
Definition: vision.h:56
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.ROIAlignAttrs", ROIAlignAttrs, BaseAttrsNode)
bool aligned
Definition: vision.h:55
double spatial_scale
Definition: vision.h:53
ffi::String mode
Definition: vision.h:57
int sample_ratio
Definition: vision.h:54
ffi::Array< int64_t > pooled_size
Definition: vision.h:52
Attributes used in ROIPool operator.
Definition: vision.h:76
ffi::String layout
Definition: vision.h:79
static void RegisterReflection()
Definition: vision.h:81
TVM_FFI_DECLARE_OBJECT_INFO_FINAL("relax.attrs.ROIPoolAttrs", ROIPoolAttrs, BaseAttrsNode)
double spatial_scale
Definition: vision.h:78
ffi::Array< int64_t > pooled_size
Definition: vision.h:77