tvm
bnn.h
Go to the documentation of this file.
1 /*
2  * Licensed to the Apache Software Foundation (ASF) under one
3  * or more contributor license agreements. See the NOTICE file
4  * distributed with this work for additional information
5  * regarding copyright ownership. The ASF licenses this file
6  * to you under the Apache License, Version 2.0 (the
7  * "License"); you may not use this file except in compliance
8  * with the License. You may obtain a copy of the License at
9  *
10  * http://www.apache.org/licenses/LICENSE-2.0
11  *
12  * Unless required by applicable law or agreed to in writing,
13  * software distributed under the License is distributed on an
14  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
15  * KIND, either express or implied. See the License for the
16  * specific language governing permissions and limitations
17  * under the License.
18  */
19 
24 #ifndef TVM_TOPI_X86_BNN_H_
25 #define TVM_TOPI_X86_BNN_H_
26 
28 #include <tvm/te/operation.h>
29 #include <tvm/topi/detail/fuse.h>
30 #include <tvm/topi/tags.h>
31 
32 namespace tvm {
33 namespace topi {
34 
35 using namespace tvm::te;
36 
37 namespace x86 {
46 inline Schedule schedule_binarize_pack(const Target& target, const Array<Tensor>& outs) {
47  Array<Operation> out_ops;
48  for (auto t : outs) {
49  out_ops.push_back(t->op);
50  }
51  auto s = create_schedule(out_ops);
52 
53  auto _schedule = [&](const Tensor& out) {
54  s[out].parallel(out->op.as<ComputeOpNode>()->axis[0]);
55  };
56 
57  std::function<void(Operation)> traverse;
58  traverse = [&](const Operation& op) {
59  if (op->tag == "binarize_pack") {
60  _schedule(op.output(0));
61  } else {
62  LOG(ERROR) << "Unsupported operator " << op->tag;
63  }
64  };
65 
66  traverse(outs[0]->op);
67  return s;
68 }
69 
/*!
 * \brief Create an x86 schedule for binary_dense.
 *
 * \param target The target to generate a schedule for.
 * \param outs The output tensors.
 *
 * \return A schedule for the given ops.
 */
inline Schedule schedule_binary_dense(const Target& target, const Array<Tensor>& outs) {
  // Build a schedule over all output operations.
  Array<Operation> out_ops;
  for (auto t : outs) {
    out_ops.push_back(t->op);
  }
  auto s = create_schedule(out_ops);

  // Schedule one binary_dense stage C. A (data) and B (weight) are
  // accepted for uniformity but are currently unused by the body.
  auto _schedule = [&](const Tensor& A, const Tensor& B, const Tensor& C) {
    // Split the first reduction axis of C by a factor of 8, then
    // parallelize C over its outermost spatial axis.
    IterVar co, ci;
    s[C].split(s[C]->op.as<ComputeOpNode>()->reduce_axis[0], 8, &co, &ci);
    s[C].parallel(s[C]->op.as<ComputeOpNode>()->axis[0]);

    // If C is not itself a schedule output (i.e. further stages were
    // fused after it), apply the output-stage scheduling to the real
    // output tensor instead.
    Tensor out;
    if (detail::contains(s->outputs, C->op)) {
      out = C;
    } else {
      out = outs[0]->op.output(0);
    }

    // Split the second spatial axis of the output stage by 8 and
    // vectorize the inner lanes.
    IterVar xo, xi;
    s[out].split(out->op.as<ComputeOpNode>()->axis[1], 8, &xo, &xi);
    s[out].vectorize(xi);
  };

  std::function<void(Operation)> traverse;
  traverse = [&](const Operation& op) {
    // Inline all one-to-one-mapping operators except the last stage (output)
    if (is_broadcast(op->tag)) {
      if (!detail::contains(s->outputs, op)) {
        s[op].compute_inline();
      }
      // Recurse into producers that are themselves computed stages
      // (placeholders have no input tensors and are skipped).
      for (auto tensor : op->InputTensors()) {
        if (tensor->op->InputTensors().size() > 0) {
          traverse(tensor->op);
        }
      }
    } else if (op->tag == "binary_dense") {
      // binary_dense takes (data, weight) as its two inputs.
      auto output = op.output(0);
      auto data = op->InputTensors()[0];
      auto weight = op->InputTensors()[1];
      _schedule(data, weight, output);
    } else {
      LOG(ERROR) << "Unsupported operator " << op->tag;
    }
  };

  traverse(outs[0]->op);
  return s;
}
127 
128 } // namespace x86
129 } // namespace topi
130 } // namespace tvm
131 #endif // TVM_TOPI_X86_BNN_H_
Managed reference class to TargetNode.
Definition: target.h:200
Array, container representing a contiguous sequence of ObjectRefs.
Definition: array.h:289
void push_back(const T &item)
push a new item to the back of the list
Definition: array.h:457
const ObjectType * as() const
Try to downcast the internal Object to a raw pointer of a corresponding type.
Definition: object.h:910
Array< IterVar > axis
IterVar on each axis.
Definition: operation.h:207
Array< IterVar > reduce_axis
IterVar on each reduction axis, if the body is a Reduce.
Definition: operation.h:209
A Compute op that compute a tensor on certain domain.
Definition: operation.h:226
Operation that produces tensors.
Definition: tensor.h:47
Global schedule container for operations and all the operations they depend on. The schedule per Operation is named as stage.
Definition: schedule.h:326
Tensor structure representing a possible input, or intermediate computation result.
Definition: tensor.h:102
Iteration Variable, represents an iteration over an integer interval.
Definition: var.h:315
Fuse operation.
Generic function that can be specialized on a per target basis.
Tensor expression language DSL.
Definition: extracted_task.h:33
Schedule create_schedule(Array< Operation > ops)
Create a schedule for array of ops(and their dependencies).
Definition: schedule.h:702
Schedule schedule_binarize_pack(const Target &target, const Array< Tensor > &outs)
Create a generic schedule for binarize_pack.
Definition: bnn.h:46
Schedule schedule_binary_dense(const Target &target, const Array< Tensor > &outs)
Create a generic schedule for binary_dense.
Definition: bnn.h:78
bool is_broadcast(std::string tag)
Definition: tags.h:47
runtime implementation for LibTorch/TorchScript.
Definition: analyzer.h:36
Operation node can generate one or multiple Tensors.
External function interface to rocBLAS libraries.