[MLIR][MHLO] Add pattern to move ops into the assuming region

This will eventually allow to make assuming regions' constraints independent from each other. PiperOrigin-RevId: 365985081
2021-03-31 01:22:20 -07:00 · 2021-03-31 01:22:20 -07:00 · eade942635
parent 5ec66775d4
commit eade942635
2 changed files with 125 additions and 0 deletions
--- a/lib/Dialect/mhlo/transforms/move_up_dynamic_broadcasts_for_fusion.cc
+++ b/lib/Dialect/mhlo/transforms/move_up_dynamic_broadcasts_for_fusion.cc
@ -25,6 +25,7 @@ limitations under the License.
 #include "mlir/Dialect/Shape/IR/Shape.h"
 #include "mlir/Dialect/StandardOps/IR/Ops.h"
 #include "mlir/Dialect/Tensor/IR/Tensor.h"
+#include "mlir/IR/BlockAndValueMapping.h"
 #include "mlir/IR/BuiltinOps.h"
 #include "mlir/IR/BuiltinTypes.h"
 #include "mlir/IR/MLIRContext.h"
@ -96,6 +97,71 @@ struct InlineBroadcastedShapeOperandsPattern : public OpRewritePattern<OpTy> {
  }
 };

+/// Move operation into a preceeding assuming op. This allows to process
+/// operations that depend on the assuming op's results. It will eventually
+/// allow to make assuming regions' constraints independent from each other.
+template <typename OpTy>
+struct MoveIntoAssumingOpPattern : public OpRewritePattern<OpTy> {
+  using OpRewritePattern<OpTy>::OpRewritePattern;
+
+  LogicalResult matchAndRewrite(OpTy op,
+                                PatternRewriter &rewriter) const override {
+    // Only move into immediately preceeding `assuming` op.
+    auto assuming_op =
+        llvm::dyn_cast_or_null<shape::AssumingOp>(op->getPrevNode());
+    if (!assuming_op) return failure();
+
+    Block *body = assuming_op.getBody();
+    auto yield_op = cast<shape::AssumingYieldOp>(body->getTerminator());
+
+    // Find the operands to use if the op was within the assuming region. We
+    // will later use their copies, as we copy the assuming op and its body.
+    SmallVector<Value, 8> new_operands_unmapped;
+    for (auto operand : op->getOperands()) {
+      new_operands_unmapped.push_back(operand);
+      for (auto result : llvm::enumerate(assuming_op->getResults())) {
+        if (result.value() == operand)
+          new_operands_unmapped.back() = yield_op->getOperand(result.index());
+      }
+    }
+
+    // Insert the rewritten assuming op right before the old one.
+    OpBuilder::InsertionGuard guard(rewriter);
+    rewriter.setInsertionPoint(assuming_op);
+    auto new_assuming_op = rewriter.create<shape::AssumingOp>(
+        assuming_op.getLoc(), assuming_op.witness(),
+        [&](OpBuilder &b, Location loc) {
+          // Copy body.
+          BlockAndValueMapping mapping;
+          for (auto &nested : body->without_terminator())
+            b.clone(nested, mapping);
+
+          // Copy op into the new body and use the mapped operands.
+          SmallVector<Value, 2> new_operands;
+          for (Value v_unmapped : new_operands_unmapped) {
+            Value v = mapping.lookupOrDefault(v_unmapped);
+            new_operands.push_back(v);
+          }
+          Value new_op = b.create<OpTy>(loc, op->getResultTypes(), new_operands,
+                                        op->getAttrs());
+
+          // Yield the previous results and also the new one.
+          SmallVector<Value, 2> mapped_results;
+          for (auto result : yield_op.operands())
+            mapped_results.push_back(mapping.lookupOrDefault(result));
+          mapped_results.push_back(new_op);
+          return mapped_results;
+        });
+
+    // Replace the assuming op and the root op with the corresponding result
+    // value.
+    ValueRange new_assuming_op_results = new_assuming_op->getResults();
+    rewriter.replaceOp(assuming_op, new_assuming_op_results.drop_back());
+    rewriter.replaceOp(op, new_assuming_op_results.back());
+    return success();
+  }
+};
+
 // TODO(frgossen): Only move up broadcasting operations if there is a consumer.
 struct MoveUpBroadcastInDimOpPattern
    : public OpRewritePattern<DynamicBroadcastInDimOp> {
@ -168,6 +234,8 @@ void PopulateMoveUpDynamicBroadcastsForFusionPatterns(
  // clang-format off
  patterns->insert<
      InlineBroadcastedShapeOperandsPattern<shape::CstrBroadcastableOp>,
+      MoveIntoAssumingOpPattern<shape::ShapeOfOp>,
+      MoveIntoAssumingOpPattern<shape::CstrBroadcastableOp>,
      MoveUpBroadcastInDimOpPattern,
      ShapeReificationPattern>(context);
  // clang-format on
--- a/tests/move_up_dynamic_broadcasts_for_fusion.mlir
+++ b/tests/move_up_dynamic_broadcasts_for_fusion.mlir
@ -110,3 +110,60 @@ func @inline_bcasted_shape_operands(%a : tensor<?xindex>, %b : tensor<?xindex>,
  %1 = shape.cstr_broadcastable %0, %c : tensor<?xindex>, tensor<?xindex>
  return %1 : !shape.witness
 }
+
+// -----
+
+// CHECK-LABEL: @move_shape_of_into_assuming
+// CHECK-SAME: (%[[ARG0:.*]]: !shape.witness, %[[ARG1:.*]]: tensor<?x32xf32>, %[[ARG2:.*]]: tensor<?x32xf32>)
+func @move_shape_of_into_assuming(%arg0 : !shape.witness,
+    %arg1 : tensor<?x32xf32>, %arg2 : tensor<?x32xf32>) -> tensor<3xindex> {
+  // CHECK:     %[[ASSUMING_RESULTS:.*]]:3 = shape.assuming %[[ARG0]] -> (tensor<?x32xf32>, tensor<?x32xf32>, tensor<3xindex>) {
+  // CHECK:       %[[SHAPE:.*]] = shape.shape_of %[[ARG2]]
+  // CHECK:       shape.assuming_yield %[[ARG1]], %[[ARG2]], %[[SHAPE]]
+  // CHECK:     }
+  // CHECK-NOT: shape_of
+  // CHECK:     return %[[ASSUMING_RESULTS]]#2
+  %0:2 = shape.assuming %arg0 -> (tensor<?x32xf32>, tensor<?x32xf32>) {
+    shape.assuming_yield %arg1, %arg2 : tensor<?x32xf32>, tensor<?x32xf32>
+  }
+  %1 = shape.shape_of %0#1 : tensor<?x32xf32> -> tensor<3xindex>
+  return %1 : tensor<3xindex>
+}
+
+// -----
+
+// CHECK-LABEL: @move_cstr_broadcastable_into_assuming
+// CHECK-SAME: (%[[ARG0:.*]]: !shape.witness, %[[ARG1:.*]]: tensor<2xindex>, %[[ARG2:.*]]: tensor<3xindex>)
+func @move_cstr_broadcastable_into_assuming(%arg0 : !shape.witness,
+    %arg1 : tensor<2xindex>, %arg2 : tensor<3xindex>) -> !shape.witness {
+  // CHECK:     %[[ASSUMING_RESULTS:.*]]:3 = shape.assuming %[[ARG0]] -> (tensor<2xindex>, tensor<3xindex>, !shape.witness) {
+  // CHECK:       %[[WITNESS:.*]] = shape.cstr_broadcastable %[[ARG1]], %[[ARG2]]
+  // CHECK:       shape.assuming_yield %[[ARG1]], %[[ARG2]], %[[WITNESS]]
+  // CHECK:     }
+  // CHECK-NOT: cstr_broadcastable
+  // CHECK:     return %[[ASSUMING_RESULTS]]#2
+  %0:2 = shape.assuming %arg0 -> (tensor<2xindex>, tensor<3xindex>) {
+    shape.assuming_yield %arg1, %arg2 : tensor<2xindex>, tensor<3xindex>
+  }
+  %1 = shape.cstr_broadcastable %arg1, %0#1 : tensor<2xindex>, tensor<3xindex>
+  return %1 : !shape.witness
+}
+
+// -----
+
+// CHECK-LABEL: @not_move_shape_of_into_assuming
+func @not_move_shape_of_into_assuming(%arg0 : !shape.witness,
+    %arg1 : tensor<?x32xf32>, %arg2 : tensor<?x32xf32>) -> tensor<3xindex> {
+  // CHECK:      shape.assuming
+  // CHECK-SAME: {
+  // CHECK-NOT:    shape_of
+  // CHECK:      }
+  // CHECK:     "some.other.op"
+  // CHECK:     shape_of
+  %0:2 = shape.assuming %arg0 -> (tensor<?x32xf32>, tensor<?x32xf32>) {
+    shape.assuming_yield %arg1, %arg2 : tensor<?x32xf32>, tensor<?x32xf32>
+  }
+  "some.other.op"() : () -> ()
+  %2 = shape.shape_of %0#1 : tensor<?x32xf32> -> tensor<3xindex>
+  return %2 : tensor<3xindex>
+}