tvm
schedule.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
24 // Acknowledgement: Many schedule primitives originate from Halide and Loopy.
25 #ifndef TVM_TE_SCHEDULE_H_
26 #define TVM_TE_SCHEDULE_H_
27 
28 #include <tvm/support/with.h>
29 #include <tvm/te/tensor.h>
30 #include <tvm/te/tensor_intrin.h>
31 #include <tvm/tir/expr.h>
32 #include <tvm/tir/index_map.h>
33 
34 #include <string>
35 #include <unordered_map>
36 
37 namespace tvm {
38 namespace te {
39 // Node container for Stage
40 class StageNode;
41 // Node container for Schedule
42 class ScheduleNode;
43 // Node container for IterVarRelation
44 class IterVarRelationNode;
45 // Attribute of itervar.
46 class IterVarAttrNode;
47 
// The attachment type of a stage (stored in StageNode::attach_type).
// NOTE(review): only kInline and kScope are visible in this extract; the generated index
// also records definitions at listing lines 50, 52 and 54 whose enumerator lines are not
// shown here (StageNode defaults attach_type to kGroupRoot, which is one of them).
49 enum AttachType : int {
51  kInline = 2,
53  kScope = 4,
55 };
56 
// Stage, contains scheduling for a stage of computation.
// Managed reference whose node container is StageNode (see operator->).
// Every scheduling primitive below returns Stage&.
// NOTE(review): the index also lists set_axis_separators(const Array<IntImm>&) for this
// class, and the "declare container type" macro line (listing 309) is not visible in this extract.
58 class Stage : public ObjectRef {
59  public:
    // Default constructor; takes no node.
60  Stage() {}
    // Wrap an existing object pointer.
61  explicit Stage(ObjectPtr<Object> n) : ObjectRef(n) {}
    // Construct a stage from an operation (defined out of line).
66  explicit Stage(Operation op);
    // Access the internal node container (const).
71  inline const StageNode* operator->() const;
    // Access the internal node container (mutable).
76  inline StageNode* operator->();
    // Set the memory scope of the stage.
81  TVM_DLL Stage& set_scope(std::string scope); // NOLINT(*)
    // Specify the schedule to be computed at the parent schedule's scope.
88  TVM_DLL Stage& compute_at(Stage parent, IterVar scope); // NOLINT(*)
    // Compute the function inline.
93  TVM_DLL Stage& compute_inline(); // NOLINT(*)
    // Compute the function at group root.
98  TVM_DLL Stage& compute_root(); // NOLINT(*)
    // Bind the IterVar to thread index.
106  TVM_DLL Stage& bind(IterVar ivar, IterVar thread_ivar);
    // Set the predicate to determine whether a store to the array should be performed.
117  TVM_DLL Stage& set_store_predicate(PrimExpr predicate);
    // Specify environment threads launched around the group's scope.
126  TVM_DLL Stage& env_threads(Array<IterVar> threads);
    // Split the parent by factor.
    // NOTE(review): p_outer / p_inner look like output pointers for the resulting
    // iteration variables — confirm against the implementation.
135  TVM_DLL Stage& split(IterVar parent, PrimExpr factor, IterVar* p_outer,
136  IterVar* p_inner); // NOLINT(*)
    // Split the iteration with given number of parts.
146  TVM_DLL Stage& split_by_nparts(IterVar parent, PrimExpr nparts, IterVar* p_outer,
147  IterVar* p_inner); // NOLINT(*)
    // Fuse the inner and outer domains into the target.
155  TVM_DLL Stage& fuse(IterVar outer, IterVar inner, IterVar* p_target); // NOLINT(*)
    // Overload of fuse taking an array of axes.
    // NOTE(review): no brief is available for this overload in the extract — confirm semantics.
169  TVM_DLL Stage& fuse(const Array<IterVar>& axes, IterVar* p_target); // NOLINT(*)
    // Reorder the iteration.
175  TVM_DLL Stage& reorder(const Array<IterVar>& order); // NOLINT(*)
    // Perform tiling on two dimensions.
191  TVM_DLL Stage& tile(IterVar x_parent, IterVar y_parent, // NOLINT(*)
192  PrimExpr x_factor, PrimExpr y_factor, IterVar* p_x_outer, IterVar* p_y_outer,
193  IterVar* p_x_inner, IterVar* p_y_inner);
    // Vectorize iteration.
199  TVM_DLL Stage& vectorize(IterVar var); // NOLINT(*)
    // Replace computation of the current stage by tensor intrinsic f.
207  TVM_DLL Stage& tensorize(IterVar var, TensorIntrin f); // NOLINT(*)
    // Unroll iteration.
213  TVM_DLL Stage& unroll(IterVar var); // NOLINT(*)
    // Parallelize iteration.
219  TVM_DLL Stage& parallel(IterVar var); // NOLINT(*)
    // Annotate the iteration with pragma; pragma_value defaults to an empty PrimExpr().
229  TVM_DLL Stage& pragma(IterVar var, const std::string& pragma_type,
230  const PrimExpr& pragma_value = PrimExpr()); // NOLINT(*)
    // Fetch data in advance.
238  TVM_DLL Stage& prefetch(const Tensor& domain, IterVar var, PrimExpr offset); // NOLINT(*)
    // Set alignment requirement for specific dimension.
249  TVM_DLL Stage& storage_align(IterVar axis, int factor, int offset); // NOLINT(*)
    // Compute current stage with double buffering.
254  TVM_DLL Stage& double_buffer(); // NOLINT(*)
    // Compute current stage with rolling buffering.
259  TVM_DLL Stage& rolling_buffer(); // NOLINT(*)
    // Defines a layout transformation to be applied to the buffer.
    // out_iter_vars is optional and defaults to nullptr.
284  TVM_DLL Stage& transform_layout(const Array<Var>& initial_indices,
285  const Array<PrimExpr>& final_indices,
286  Array<IterVar>* out_iter_vars = nullptr);
    // Whether the stage has been scheduled.
299  bool is_scheduled() const;
    // Get attachment spec of current stage.
307  Stage GetAttachSpec() const;
308  // declare container type
310 };
311 
// Global schedule container for operations and all the operations they depend on.
// Managed reference whose node container is ScheduleNode (see operator->).
// NOTE(review): the index also records a Schedule(ObjectPtr<Object> n) constructor at
// listing line 320 and a "declare container type" macro line (listing 445); neither is
// visible in this extract.
317 class Schedule : public ObjectRef {
318  public:
    // Default constructor; takes no node.
319  Schedule() {}
    // Construct a schedule from an array of operations (defined out of line).
326  TVM_DLL explicit Schedule(Array<Operation> ops);
    // Returns a Schedule by value.
    // NOTE(review): depth of the copy is not visible here — confirm.
331  Schedule copy() const;
    // Look up the stage for an operation.
336  TVM_DLL Stage operator[](const Operation& op);
    // Short hand for getting the stage of tensor's operation; forwards tensor->op to the overload above.
342  TVM_DLL Stage operator[](const Tensor& tensor) { return this->operator[](tensor->op); }
    // Create a group stage from output and input tensors; include_inputs defaults to false.
    // NOTE(review): exact grouping semantics are not visible in this extract.
352  TVM_DLL Stage create_group(const Array<Tensor>& outputs, const Array<Tensor>& inputs,
353  bool include_inputs = false);
    // NOTE(review): no briefs for cache_read / cache_write / rfactor / normalize* survive in
    // this extract; consult the upstream header before relying on their semantics.
363  TVM_DLL Tensor cache_read(const Tensor& tensor, const std::string& scope,
364  const Array<Operation>& readers);
    // Array-of-tensors overload.
381  TVM_DLL Array<Tensor> cache_write(const Array<Tensor>& tensor, const std::string& scope);
    // Single-tensor overload.
398  TVM_DLL Tensor cache_write(const Tensor& tensor, const std::string& scope);
    // factor_axis defaults to 0.
412  TVM_DLL Array<Tensor> rfactor(const Tensor& tensor, const IterVar& axis, int factor_axis = 0);
421  Schedule normalize();
422 
432  Schedule normalize_for_feature_extraction();
433 
    // Access the internal node container (const).
438  inline const ScheduleNode* operator->() const;
    // Access the internal node container (mutable).
443  inline ScheduleNode* operator->();
444  // declare container type
446 };
447 
// The schedule relation between IterVars; can be Split, Fuse (other subclasses in this
// file: Rebase, Singleton, Transform).
// NOTE(review): the index records constructors at listing lines 454-455 that are not
// visible in this extract.
452 class IterVarRelation : public ObjectRef {
453  public:
    // Access the internal node container.
460  inline const IterVarRelationNode* operator->() const;
461 };
462 
// Additional schedulable attributes about IterVar.
// NOTE(review): the index records constructors at listing lines 468-469 that are not
// visible in this extract.
466 class IterVarAttr : public ObjectRef {
467  public:
    // Access the internal node container.
474  inline const IterVarAttrNode* operator->() const;
475 };
476 
// Node container that represents a stage; reached through Stage::operator->.
// NOTE(review): this extract omits several listing lines, so the braces below do not
// balance as shown. Missing are the member declarations the index places at listing
// lines 498-569 (op, origin_op, all_iter_vars, leaf_iter_vars, env_threads,
// store_predicate, relations, iter_var_attrs, attach_ivar, attach_stage,
// layout_transforms, axis_separators, group) and the VisitAttrs signature at listing line 573.
492 class StageNode : public Object {
493  public:
    // Attachment type of this stage; defaults to kGroupRoot.
544  AttachType attach_type{kGroupRoot};
    // The thread storage scope level of the stage.
550  std::string scope;
    // Output flag; defaults to false.
552  bool is_output{false};
    // Double-buffering flag; defaults to false.
    // Presumably set by Stage::double_buffer() — confirm.
554  bool double_buffer{false};
    // Rolling-buffering flag; defaults to false.
    // Presumably set by Stage::rolling_buffer() — confirm.
556  bool rolling_buffer{false};
    // Child-stage counter; defaults to 0.
571  int num_child_stages{0};
572 
    // Body of VisitAttrs(AttrVisitor* v): passes each field to the visitor under a string key.
    // NOTE(review): rolling_buffer and store_predicate have no v->Visit entry below,
    // unlike double_buffer — confirm whether that is intentional.
574  v->Visit("op", &op);
575  v->Visit("origin_op", &origin_op);
576  v->Visit("all_iter_vars", &all_iter_vars);
577  v->Visit("leaf_iter_vars", &leaf_iter_vars);
578  v->Visit("env_threads", &env_threads);
579  v->Visit("relations", &relations);
580  v->Visit("iter_var_attrs", &iter_var_attrs);
581  v->Visit("attach_type", &attach_type);
582  v->Visit("attach_ivar", &attach_ivar);
583  v->Visit("attach_stage", &attach_stage);
584  v->Visit("scope", &scope);
585  v->Visit("is_output", &is_output);
586  v->Visit("double_buffer", &double_buffer);
587  v->Visit("layout_transforms", &layout_transforms);
588  v->Visit("axis_separators", &axis_separators);
589  v->Visit("group", &group);
590  v->Visit("num_child_stages", &num_child_stages);
591  }
592 
    // Type key string for this node type.
593  static constexpr const char* _type_key = "Stage";
595 };
596 
// Node container for schedule; reached through Schedule::operator->.
// NOTE(review): this extract omits the member declarations the index places at listing
// lines 601-612 (outputs, stages, groups, stage_map) and the VisitAttrs signature at
// listing line 619, so the braces below do not balance as shown.
598 class ScheduleNode : public Object {
599  public:
    // Internal stage map to map internal ops to stages, keyed by raw Object pointer.
    // Per the index it is created on demand and can be invalidated.
    // It is not passed to the attribute visitor below.
617  std::unordered_map<const Object*, Stage> op2stage_cache_;
618 
    // Body of VisitAttrs(AttrVisitor* v): passes each field to the visitor under a string key.
620  v->Visit("outputs", &outputs);
621  v->Visit("stages", &stages);
622  v->Visit("groups", &groups);
623  v->Visit("stage_map", &stage_map);
624  }
625 
    // Presumably builds op2stage_cache_ — confirm against the implementation.
627  void InitCache();
    // Presumably discards op2stage_cache_ — confirm against the implementation.
629  void InvalidateCache();
630 
    // Check whether the schedule contains an operation.
636  TVM_DLL bool Contain(const Operation& op) const;
637 
    // Check if the schedule contains a Tensor; forwards tensor->op to the overload above.
643  TVM_DLL bool Contain(const Tensor& tensor) const { return Contain(tensor->op); }
644 
    // Type key string for this node type.
645  static constexpr const char* _type_key = "Schedule";
647 };
648 
// Create a schedule for array of ops (and their dependencies).
// Thin wrapper that forwards ops to the explicit Schedule(Array<Operation>) constructor.
654 inline Schedule create_schedule(Array<Operation> ops) { return Schedule(ops); }
655 
// Node container for IterVar attr; reached through IterVarAttr::operator->.
// NOTE(review): this extract omits the member declarations the index places at listing
// lines 662-683 (bind_thread, prefetch_data, prefetch_offset, tensor_intrin,
// pragma_keys, pragma_values) and the VisitAttrs signature at listing line 685, so the
// braces below do not balance as shown.
657 class IterVarAttrNode : public Object {
658  public:
    // Iteration type of the variable; defaults to kDataPar.
660  IterVarType iter_type{kDataPar};
    // Alignment factor; defaults to 0.
    // Presumably populated by Stage::storage_align — confirm.
673  int dim_align_factor{0};
    // Alignment offset; defaults to 0.
    // Presumably populated by Stage::storage_align — confirm.
675  int dim_align_offset{0};
684 
    // Body of VisitAttrs(AttrVisitor* v): passes each field to the visitor under a string key.
686  v->Visit("iter_type", &iter_type);
687  v->Visit("bind_thread", &bind_thread);
688  v->Visit("prefetch_data", &prefetch_data);
689  v->Visit("prefetch_offset", &prefetch_offset);
690  v->Visit("tensor_intrin", &tensor_intrin);
691  v->Visit("dim_align_factor", &dim_align_factor);
692  v->Visit("dim_align_offset", &dim_align_offset);
693  v->Visit("pragma_keys", &pragma_keys);
694  v->Visit("pragma_values", &pragma_values);
695  }
696 
    // Type key string for this node type.
697  static constexpr const char* _type_key = "IterVarAttr";
699 };
700 
// Base node of iteration var relations; reached through IterVarRelation::operator->.
// NOTE(review): the object-info macro line (listing 705) is not visible in this extract.
702 class IterVarRelationNode : public Object {
703  public:
    // Type key string for this node type.
704  static constexpr const char* _type_key = "IterVarRelation";
706 };
707 
713  public:
724 
726  v->Visit("parent", &parent);
727  v->Visit("outer", &outer);
728  v->Visit("inner", &inner);
729  v->Visit("factor", &factor);
730  v->Visit("nparts", &nparts);
731  }
732 
733  static constexpr const char* _type_key = "Split";
735 };
736 
// Managed reference to SplitNode.
// NOTE(review): the reference-methods macro line (listing 745) is not visible in this extract.
741 class Split : public IterVarRelation {
742  public:
    // Construct from the parent/outer/inner iteration variables plus factor and nparts.
    // Per the index entry for nparts, only one of factor or nparts can be given.
743  TVM_DLL Split(IterVar parent, IterVar outer, IterVar inner, PrimExpr factor, PrimExpr nparts);
744 
746 };
747 
752  public:
759 
761  v->Visit("outer", &outer);
762  v->Visit("inner", &inner);
763  v->Visit("fused", &fused);
764  }
765 
766  static constexpr const char* _type_key = "Fuse";
768 };
769 
// Managed reference to FuseNode.
// NOTE(review): the reference-methods macro line (listing 778) is not visible in this extract.
774 class Fuse : public IterVarRelation {
775  public:
    // Construct from the outer and inner iteration variables and the fused target variable.
776  TVM_DLL Fuse(IterVar outer, IterVar inner, IterVar fused);
777 
779 };
780 
787  public:
792 
794  v->Visit("parent", &parent);
795  v->Visit("rebased", &rebased);
796  }
797 
798  static constexpr const char* _type_key = "Rebase";
800 };
801 
// Managed reference to RebaseNode.
// NOTE(review): the reference-methods macro line (listing 810) is not visible in this extract.
806 class Rebase : public IterVarRelation {
807  public:
    // Construct from the parent iteration variable and its rebased counterpart.
808  TVM_DLL Rebase(IterVar parent, IterVar rebased);
809 
811 };
812 
817  public:
820 
821  void VisitAttrs(AttrVisitor* v) { v->Visit("iter", &iter); }
822 
823  static constexpr const char* _type_key = "Singleton";
825 };
826 
// Managed reference to SingletonNode.
// NOTE(review): the reference-methods macro line (listing 835) is not visible in this extract.
831 class Singleton : public IterVarRelation {
832  public:
    // Construct from the singleton iterator.
833  TVM_DLL explicit Singleton(IterVar iter);
834 
836 };
837 
842  public:
851 
859 
865 
872 
874  v->Visit("original_variables", &original_variables);
875  v->Visit("transformed_variables", &transformed_variables);
876  v->Visit("forward_transformation", &forward_transformation);
877  v->Visit("inverse_transformation", &inverse_transformation);
878  }
879 
880  static constexpr const char* _type_key = "Transform";
882 };
883 
// Reference class for the "Transform" iteration relation.
// NOTE(review): presumably the managed reference to TransformNode, by analogy with
// Split/Fuse/Rebase/Singleton — confirm; the macro line (listing 890) is not visible
// in this extract.
884 class Transform : public IterVarRelation {
885  public:
    // Construct from the original and transformed variable lists plus the forward and
    // inverse index maps between them.
886  TVM_DLL explicit Transform(Array<IterVar> original_variables,
887  Array<IterVar> transformed_variables, IndexMap forward_transformation,
888  IndexMap inverse_transformation);
889 
891 };
892 
895  public:
902 
903  void VisitAttrs(AttrVisitor* v) { v->Visit("clauses", &clauses); }
904 
905  static constexpr const char* _type_key = "SpecializedCondition";
907 };
908 
913  public:
918  TVM_DLL SpecializedCondition(Array<PrimExpr> conditions); // NOLINT(*)
919 
924  TVM_DLL static SpecializedCondition Current();
925 
927  class Internal;
928 
929  private:
930  // enable with syntax.
931  friend class Internal;
932  friend class With<SpecializedCondition>;
934  TVM_DLL void EnterWithScope();
936  TVM_DLL void ExitWithScope();
937 };
938 
939 // implementations
// Access the internal node container: casts the stored object pointer to StageNode
// (const overload uses get(), mutable overload uses get_mutable()).
940 inline const StageNode* Stage::operator->() const { return static_cast<const StageNode*>(get()); }
941 inline StageNode* Stage::operator->() { return static_cast<StageNode*>(get_mutable()); }
942 
// Access the internal node container: casts the stored object pointer to ScheduleNode
// (const overload uses get(), mutable overload uses get_mutable()).
943 inline const ScheduleNode* Schedule::operator->() const {
944  return static_cast<const ScheduleNode*>(get());
945 }
946 inline ScheduleNode* Schedule::operator->() { return static_cast<ScheduleNode*>(get_mutable()); }
947 
949  return static_cast<const IterVarRelationNode*>(get());
950 }
951 
953  return static_cast<const IterVarAttrNode*>(get());
954 }
955 
956 } // namespace te
957 } // namespace tvm
958 #endif // TVM_TE_SCHEDULE_H_
Array< Stage > groups
List of all stage groups.
Definition: schedule.h:610
Stage()
Definition: schedule.h:60
Split the parent domain into product of outer and inner.
Definition: schedule.h:712
Array< IterVar > original_variables
The loop variables that were replaced by the transformation.
Definition: schedule.h:850
Stage & compute_root()
Compute the function at group root.
Managed reference to RebaseNode.
Definition: schedule.h:806
represents a stage.
Definition: schedule.h:492
A custom smart pointer for Object.
Definition: object.h:358
IterVar bind_thread
The thread this iter Var binds, can be null.
Definition: schedule.h:662
Global schedule container For operations and all the operations they depend on. The schedule per Oper...
Definition: schedule.h:317
IterVar outer
The outer domain.
Definition: schedule.h:754
Stage operator[](const Tensor &tensor)
Short hand for getting the stage of tensor's operation.
Definition: schedule.h:342
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:573
Schedule create_schedule(Array< Operation > ops)
Create a schedule for array of ops(and their dependencies).
Definition: schedule.h:654
Stage(ObjectPtr< Object > n)
Definition: schedule.h:61
Array< Operation > outputs
The output operations in original data flow graph.
Definition: schedule.h:601
Definition: schedule.h:54
const IterVarRelationNode * operator->() const
access the internal node container
Definition: schedule.h:948
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:619
Fuse two domains into one domain.
Definition: schedule.h:751
Stage attach_stage
The stage this node attaches to.
Definition: schedule.h:548
runtime implementation for LibTorch/TorchScript.
Definition: analyzer.h:36
IterVar fused
The target domain.
Definition: schedule.h:758
IterVar inner
The inner domain.
Definition: schedule.h:719
IndexMap inverse_transformation
Map from transformed variables to the original variables.
Definition: schedule.h:871
Schedule()
Definition: schedule.h:319
Operation that produces tensors.
Definition: tensor.h:47
IterVar inner
The inner domain.
Definition: schedule.h:756
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:793
Iteration Variable, represents an iteration over an integer interval.
Definition: var.h:301
PrimExpr nparts
Number of parts, only factor or nparts can be given.
Definition: schedule.h:723
Stage, contains scheduling for a stage of computation.
Definition: schedule.h:58
IndexMap forward_transformation
Map from the original variables to the transformed variables.
Definition: schedule.h:864
IterVar attach_ivar
The attach point of this schedule.
Definition: schedule.h:546
Stage & compute_at(Stage parent, IterVar scope)
specify the schedule to be computed at the parent schedule's scope.
AttachType
the attachment type
Definition: schedule.h:49
Array< IntImm > axis_separators
List of axes after which to divide physical axes.
Definition: schedule.h:564
Specialized condition to enable op specialization.
Definition: schedule.h:912
base class of all object containers.
Definition: object.h:167
std::string scope
The thread storage scope level of the stage.
Definition: schedule.h:550
Array< IterVar > all_iter_vars
All the nodes in the iter var.
Definition: schedule.h:518
Stage & set_scope(std::string scope)
set the memory scope of the stage
Operation op
The operation of stage, can be different from original op. If it is null, then this stage is a group ...
Definition: schedule.h:498
Definition: schedule.h:51
Managed reference to SplitNode.
Definition: schedule.h:741
Stage & set_store_predicate(PrimExpr predicate)
Set the predicate to determine whether a store to the array should be performed. Use this when there ...
Defines a remapping of buffer indices.
IterVarAttr()
Definition: schedule.h:468
bool is_scheduled() const
whether the stage has been scheduled.
Stage & double_buffer()
Compute current stage with double buffering.
Container for specialization conditions.
Definition: schedule.h:894
Visitor class to get the attributes of an AST/IR node. The content is going to be called for each fie...
Definition: reflection.h:52
TensorIntrin tensor_intrin
Tensor intrinsic used in tensorization, when the axis is marked as Tensorized.
Definition: schedule.h:671
Dataflow tensor object.
Definition: schedule.h:884
Stage & unroll(IterVar var)
Unroll iteration.
IterVarType
Type of iteration variable. Each IterVar have a specific type.
Definition: var.h:178
Rebase the iteration to make min to be 0. This is useful to normalize the Schedule to make every leaf...
Definition: schedule.h:786
Stage group
The parent group of the current stage. The stage cannot be assigned to stages outside the group...
Definition: schedule.h:569
The schedule relation between IterVars can be Split, Fuse.
Definition: schedule.h:452
Managed reference to TensorIntrinNode.
Definition: tensor_intrin.h:93
Array< IndexMap > layout_transforms
Layout transformations to be applied onto the stage's tensors.
Definition: schedule.h:558
TIR expressions.
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:760
IterVarRelation(ObjectPtr< Object > n)
Definition: schedule.h:455
Definition: schedule.h:50
Array, container representing a contiguous sequence of ObjectRefs.
Definition: array.h:289
Definition: index_map.h:167
Stage & transform_layout(const Array< Var > &initial_indices, const Array< PrimExpr > &final_indices, Array< IterVar > *out_iter_vars=nullptr)
Defines a layout transformation to be applied to the buffer.
Stage & reorder(const Array< IterVar > &order)
Reorder the iteration.
Array< Tensor > prefetch_data
List of tensor to be prefetched in this loop.
Definition: schedule.h:664
const StageNode * operator->() const
access the internal node container
Definition: schedule.h:940
node container for IterVar attr
Definition: schedule.h:657
Managed reference to SingletonNode.
Definition: schedule.h:831
const IterVarAttrNode * operator->() const
access the internal node container
Definition: schedule.h:952
Stage & set_axis_separators(const Array< IntImm > &axis_separators)
Defines separators between groups of axes.
Stage & compute_inline()
Compute the function inline.
Array< IterVar > env_threads
Specify threads to be launched at the stage. This is only valid for composite ops such as Scan...
Definition: schedule.h:532
Stage & tile(IterVar x_parent, IterVar y_parent, PrimExpr x_factor, PrimExpr y_factor, IterVar *p_x_outer, IterVar *p_y_outer, IterVar *p_x_inner, IterVar *p_y_inner)
Perform tiling on two dimensions The final loop order from outmost to inner most are [x_outer...
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:873
const ScheduleNode * operator->() const
access the internal node container
Definition: schedule.h:943
#define TVM_DEFINE_OBJECT_REF_METHODS(TypeName, ParentType, ObjectName)
Definition: object.h:713
Transform iterator according to some arbitrary expression.
Definition: schedule.h:841
RAII wrapper function to enter and exit a context object similar to python's with syntax...
Definition: with.h:58
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:685
Data parallel iteration. This normally corresponds to axis of Tensor. Allow all IterVar manipulations...
Definition: var.h:187
Array< IterVar > leaf_iter_vars
The current active leaf iter vars in the stage.
Definition: schedule.h:526
Definition: schedule.h:52
IterVar parent
The parent domain.
Definition: schedule.h:715
Var var(std::string name_hint, DataType t=DataType::Int(32))
Construct a new Var expression.
Base class of all object reference.
Definition: object.h:511
Singleton iterator [0, 1)
Definition: schedule.h:816
Stage & parallel(IterVar var)
Parallelize iteration.
Definition: schedule.h:53
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:102
Array< PrimExpr > pragma_keys
Additional pragma keys, array of StringImm.
Definition: schedule.h:679
Managed reference to FuseNode.
Definition: schedule.h:774
PrimExpr factor
The split factor.
Definition: schedule.h:721
Stage & env_threads(Array< IterVar > threads)
Specify environment threads that are launched around the group's scope. This can only be used in group st...
constexpr const char * axis_separators
Marks the physical axis separators.
Definition: stmt.h:1428
Stage & vectorize(IterVar var)
Vectorize iteration.
#define TVM_DECLARE_FINAL_OBJECT_INFO(TypeName, ParentType)
helper macro to declare type information in a final class.
Definition: object.h:671
Tensor intrinsic operations.
Schedule(ObjectPtr< Object > n)
Definition: schedule.h:320
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:821
Stage & bind(IterVar ivar, IterVar thread_ivar)
Bind the IterVar to thread index.
Stage & rolling_buffer()
Compute current stage with rolling buffering.
Map container of NodeRef->NodeRef in DSL graph. Map implements copy on write semantics, which means map is mutable but copy will happen when array is referenced in more than two places.
Definition: map.h:1271
Stage & pragma(IterVar var, const std::string &pragma_type, const PrimExpr &pragma_value=PrimExpr())
Annotate the iteration with pragma.
Array< IterVar > transformed_variables
The variables generated by the transformation.
Definition: schedule.h:858
Map< IterVar, IterVarAttr > iter_var_attrs
additional attributes about iter var.
Definition: schedule.h:542
PrimExpr store_predicate
The predicate under which store can happen Use this when there can be duplicated threads doing the sa...
Definition: schedule.h:538
Array< IterVarRelation > relations
The relation between IterVars.
Definition: schedule.h:540
Stage GetAttachSpec() const
Get attachment spec of current stage. If the stage compute at Group root, this function will traverse...
IterVar rebased
The rebased domain.
Definition: schedule.h:791
IterVarRelation()
Definition: schedule.h:454
Stage & split(IterVar parent, PrimExpr factor, IterVar *p_outer, IterVar *p_inner)
Split the parent by factor, generating the outer and inner domains.
IterVar outer
The outer domain.
Definition: schedule.h:717
Operation origin_op
The original operator. The op field can change during schedule to alternate the dataflow, while origin_op remains fixed.
Definition: schedule.h:504
Stage & fuse(IterVar outer, IterVar inner, IterVar *p_target)
Fuse the inner and outer domains into the target.
IterVarAttr(ObjectPtr< Object > n)
Definition: schedule.h:469
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:903
base node of iteration var
Definition: schedule.h:702
Reference to PrimExprNode.
Definition: expr.h:112
std::vector< std::string > Split(const std::string &str, const std::string &sub)
Split str according to substring.
Definition: einsum.h:425
void VisitAttrs(AttrVisitor *v)
Definition: schedule.h:725
node container for schedule
Definition: schedule.h:598
std::unordered_map< const Object *, Stage > op2stage_cache_
Internal stage map to map internal ops to stages. This is created on demand and can be invalidated...
Definition: schedule.h:617
Stage & storage_align(IterVar axis, int factor, int offset)
Set alignment requirement for specific dimension.
bool Contain(const Tensor &tensor) const
Check if the schedule contains a Tensor.
Definition: schedule.h:643
Object * get_mutable() const
Definition: object.h:576
Stage & split_by_nparts(IterVar parent, PrimExpr nparts, IterVar *p_outer, IterVar *p_inner)
Split the iteration with given number of parts.
Array< PrimExpr > prefetch_offset
The offset used in each prefetch.
Definition: schedule.h:666
Array< Stage > stages
list of all stages for ops. The stages are sorted in dependency order.
Definition: schedule.h:606
#define TVM_DECLARE_BASE_OBJECT_INFO(TypeName, ParentType)
helper macro to declare a base object type that can be inherited.
Definition: object.h:648
Additional schedulable attributes about IterVar.
Definition: schedule.h:466
Stage & tensorize(IterVar var, TensorIntrin f)
Replace computation of the current stage by tensor intrinsic f.
Array< PrimExpr > pragma_values
Additional values of pragma, if any.
Definition: schedule.h:683
Map< Operation, Stage > stage_map
map of original operation to the stages
Definition: schedule.h:612
Array< PrimExpr > clauses
List of conditions in conjunctive joint form (CNF). Each condition should be a simple expression...
Definition: schedule.h:901
IterVar iter
The singleton iterator.
Definition: schedule.h:819
Stage & prefetch(const Tensor &domain, IterVar var, PrimExpr offset)
Fetch data in advance.
RAII wrapper function to enter and exit a context object similar to python's with syntax...
IterVar parent
The parent domain.
Definition: schedule.h:789