Support layout inference for transpose (#250)

Added interface GetProducerOp(tensor) in Graph.

Signed-off-by: yuenan.li <yuenan.li@verisilicon.com>
2021-12-29 11:06:28 +08:00 · 2021-12-29 11:06:28 +08:00 · 75d39e2cfd
parent aed3a48248
commit 75d39e2cfd
6 changed files with 122 additions and 10 deletions
--- a/include/tim/vx/graph.h
+++ b/include/tim/vx/graph.h
@ -69,9 +69,16 @@ class Graph {
      const std::shared_ptr<Tensor>& tensor,
      const Operation* op) = 0;

+  virtual void UpdateTensorProducerMap(  // Records `op` as a producer of `tensor`.
+      const std::shared_ptr<Tensor>& tensor,
+      const Operation* op) = 0;
+
  virtual const std::vector<std::shared_ptr<Operation>> GetConsumersOp(
      std::shared_ptr<Tensor> tensor) const = 0;

+  virtual std::vector<std::shared_ptr<Operation>> GetProducerOp(  // Returns the operations recorded as producers of `tensor`.
+      std::shared_ptr<Tensor> tensor) = 0;
+
  virtual void PrintGraph() const = 0;

 protected:
--- a/src/tim/transform/layout_inference.cc
+++ b/src/tim/transform/layout_inference.cc
@ -59,6 +59,7 @@
 #include "ops/deconv2d_layout_inference.h"
 #include "ops/batchnorm_layout_inference.h"
 #include "ops/default_layout_inference.h"
+#include "ops/transpose_layout_inference.h"

 #include <algorithm>
 #include <deque>
@ -257,6 +258,7 @@ std::vector<std::shared_ptr<vx::Tensor>> HandleLayoutInfer(
    REGIST_LAYOUT_INFERENCE(VSI_NN_OP_ARGMIN, Arg);
    REGIST_LAYOUT_INFERENCE(VSI_NN_OP_DECONVOLUTION, DeConv2d);
    REGIST_LAYOUT_INFERENCE(VSI_NN_OP_BATCH_NORM, BatchNorm);
+    REGIST_LAYOUT_INFERENCE(VSI_NN_OP_PERMUTE, Transpose);
    REGIST_LOGICAL_LAYOUT_INFERENCE(VSI_NN_OP_LOGICAL_OPS);
    REGIST_REDUCE_LAYOUT_INFERENCE(VSI_NN_OP_REDUCE);
    // use default layout inference
--- a/src/tim/transform/ops/transpose_layout_inference.h
+++ b/src/tim/transform/ops/transpose_layout_inference.h
@ -0,0 +1,76 @@
+/****************************************************************************
+ *
+ *    Copyright (c) 2020 Vivante Corporation
+ *
+ *    Permission is hereby granted, free of charge, to any person obtaining a
+ *    copy of this software and associated documentation files (the "Software"),
+ *    to deal in the Software without restriction, including without limitation
+ *    the rights to use, copy, modify, merge, publish, distribute, sublicense,
+ *    and/or sell copies of the Software, and to permit persons to whom the
+ *    Software is furnished to do so, subject to the following conditions:
+ *
+ *    The above copyright notice and this permission notice shall be included in
+ *    all copies or substantial portions of the Software.
+ *
+ *    THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ *    IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ *    FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ *    AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ *    LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
+ *    FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
+ *    DEALINGS IN THE SOFTWARE.
+ *
+ *****************************************************************************/
+#ifndef TIM_LAYOUT_INFER_TRANSPOSE_LAYOUT_INFERENCE_H_
+#define TIM_LAYOUT_INFER_TRANSPOSE_LAYOUT_INFERENCE_H_
+
+#include "tim/vx/ops/transpose.h"
+
+#include "ops/op_layout_inference.h"
+#include "permute_vector.h"
+#include "operation_private.h"
+
+namespace tim {
+namespace transform {
+class TransposeLayoutInfer : public OpLayoutInfer {  // Layout inference for the transpose op (registered for VSI_NN_OP_PERMUTE).
+ public:
+  TransposeLayoutInfer(
+      const std::shared_ptr<vx::Operation> op,
+      std::shared_ptr<layout_inference_impl::LayoutInferContext>& context)
+      : OpLayoutInfer(op, context) {}  // Only forwards op and context to the base class.
+
+  void OnInputs(  // Maps or re-creates this transpose in the inferred graph, then queues its output in next_tensors.
+      std::vector<std::shared_ptr<vx::Tensor>>& next_tensors) override {
+    auto src_input = op_->impl()->InputsTensor()[0];  // Only the first input tensor is used.
+    auto infer_input = context_->GetMapedTensor(src_input);  // Presumably the counterpart tensor in the inferred graph - TODO confirm.
+    auto input_pv = context_->GetPermuteVector(src_input);  // Permute vector the context holds for the source input.
+
+    std::vector<uint32_t> perm(op_->impl()->node()->nn_param.permute.dim_num);  // One slot per permuted dimension.
+    memcpy(perm.data(), op_->impl()->node()->nn_param.permute.perm,  // Copy the op's permutation out of the node parameters.
+           op_->impl()->node()->nn_param.permute.dim_num * sizeof(uint32_t));
+    IPermuteVectorPtr perm_pv = MakeShared(perm.size());
+    for (uint32_t i = 0; i < perm.size(); i++) {  // Mirror perm element by element into a permute-vector object.
+      perm_pv->At(i) = perm[i];
+    }
+
+    IPermuteVectorPtr final_pv = input_pv->Reverse()->Add(perm_pv);  // NOTE(review): looks like "undo the input's permute, then apply the requested one" - confirm Reverse/Add semantics.
+
+    if (final_pv->IsAligned()) {  // Presumably true when final_pv is the identity permutation - TODO confirm.
+      // Skip the transpose op by treating its input as its output; no op is created in the inferred graph.
+      context_->UpdateTensorMap(op_->impl()->OutputsTensor()[0], infer_input);
+    } else {
+      auto transpose_op =  // Otherwise emit a single Transpose that uses the combined permutation.
+          context_->infer_graph_->CreateOperation<tim::vx::ops::Transpose>(
+              final_pv->AsStdVec());
+      transpose_op->BindInput(infer_input);
+      auto infer_out = CreateOutputsTensor(final_pv);
+      transpose_op->BindOutput(infer_out[0]);  // Only the first created output tensor is bound.
+    }
+    context_->SetPermuteVector(op_->impl()->OutputsTensor()[0], MakeShared(perm.size()));  // Output gets a freshly made permute vector (presumably identity - verify MakeShared).
+    next_tensors.push_back(op_->impl()->OutputsTensor()[0]);  // Queue the source-graph output tensor for the caller.
+  }
+};
+
+}  // namespace transform
+}  // namespace tim
+#endif
--- a/src/tim/vx/graph.cc
+++ b/src/tim/vx/graph.cc
@ -87,6 +87,15 @@ void GraphImpl::UpdateTensorConsumersMap(const std::shared_ptr<Tensor>& tensor,
  }
 }

+void GraphImpl::UpdateTensorProducerMap(const std::shared_ptr<Tensor>& tensor,  // Records `op` as a producer of `tensor` in tensor_producer_.
+                                         const Operation* op) {
+  for (const auto& added_op : op_vector_) {  // Scans every op in op_vector_; there is no early exit after a match.
+    if (added_op.get() == op) {  // Match on raw pointer identity so the stored entry is the graph's own shared_ptr.
+      tensor_producer_[tensor].push_back(added_op);  // operator[] creates the tensor's entry on first use.
+    }
+  }  // If `op` is not in op_vector_, nothing is recorded.
+}
+
 const std::vector<std::shared_ptr<Operation>> GraphImpl::GetConsumersOp(
    std::shared_ptr<Tensor> tensor) const {
  auto consumers = tensor_consumers_.find(tensor);
@ -98,6 +107,17 @@ const std::vector<std::shared_ptr<Operation>> GraphImpl::GetConsumersOp(
  }
 }

+std::vector<std::shared_ptr<Operation>> GraphImpl::GetProducerOp(  // Returns the producers recorded for `tensor`, or an empty vector if none.
+    std::shared_ptr<Tensor> tensor)  {
+  auto producer = tensor_producer_.find(tensor);  // find() does not insert, so the lookup leaves the map unchanged.
+  if (tensor_producer_.end() != producer) {
+    return producer->second;  // Returned by value: the caller gets a copy of the recorded list.
+  } else {
+    VSILOGD("Tensor has no producer, may be graph input.");
+    return {};  // No entry was recorded for this tensor.
+  }
+}
+
 void GraphImpl::PrintGraph() const { vsi_nn_PrintGraph(this->graph_); }

 std::shared_ptr<Tensor> GraphImpl::CreateTensor(const TensorSpec& spec,
--- a/src/tim/vx/graph_private.h
+++ b/src/tim/vx/graph_private.h
@ -56,19 +56,24 @@ class GraphImpl : public Graph {

  void UpdateTensorConsumersMap(const std::shared_ptr<Tensor>& tensor,
                                const Operation* op) override;
+  void UpdateTensorProducerMap(const std::shared_ptr<Tensor>& tensor,
+                                const Operation* op) override;
  const std::vector<std::shared_ptr<Operation>> GetConsumersOp(
      std::shared_ptr<Tensor> tensor) const override;
-  void PrintGraph() const override;
-  /// Implement parents' virtual functions
-   std::shared_ptr<Tensor> CreateTensor(const TensorSpec& spec,
-                                       const void* data = nullptr) override;
-   std::shared_ptr<Tensor> CreateTensor(const TensorSpec& spec,
-                                               const DmaBufferDesc& dmafd) override;
-   std::shared_ptr<Tensor> CreateTensorPlaceHolder() override;
-    bool Compile() override;
+  std::vector<std::shared_ptr<Operation>> GetProducerOp(
+      std::shared_ptr<Tensor> tensor) override;

-   bool CompileToBinary(void* buf, size_t* size) override;
-   bool Run() override;
+  void PrintGraph() const override;
+
+  std::shared_ptr<Tensor> CreateTensor(const TensorSpec& spec,
+                                       const void* data = nullptr) override;
+  std::shared_ptr<Tensor> CreateTensor(const TensorSpec& spec,
+                                       const DmaBufferDesc& dmafd) override;
+  std::shared_ptr<Tensor> CreateTensorPlaceHolder() override;
+
+  bool Compile() override;
+  bool CompileToBinary(void* buf, size_t* size) override;
+  bool Run() override;

 protected:
  ContextImpl* context_;
@ -82,6 +87,7 @@ class GraphImpl : public Graph {
  std::vector<std::shared_ptr<Tensor>> inputs_tensor_;
  std::vector<std::shared_ptr<Tensor>> outputs_tensor_;
  std::map<std::shared_ptr<Tensor>, std::vector<std::shared_ptr<Operation>>> tensor_consumers_;
+  std::map<std::shared_ptr<Tensor>, std::vector<std::shared_ptr<Operation>>> tensor_producer_;
 };

 }  // namespace vx
--- a/src/tim/vx/operation.cc
+++ b/src/tim/vx/operation.cc
@ -100,6 +100,7 @@ Operation& Operation::BindInput(const std::shared_ptr<Tensor>& tensor) {

 Operation& Operation::BindOutput(const std::shared_ptr<Tensor>& tensor) {  // Binds `tensor` as an output and returns *this so calls can be chained.
  impl_->BindOutput(tensor);
+  impl_->graph_->UpdateTensorProducerMap(tensor, this);  // Also registers this operation as a producer of `tensor` in the graph.
  return *this;
 }