[HLO] Add custom print/parse for convolution dimension numbers (in LMHLO)
PiperOrigin-RevId: 373379227
parent 30779f0c2f
commit e260aa771c

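Summary of the new syntax (taken from the tests added below): the LMHLO convolution's dimension numbers now print inline in input x kernel -> output order, e.g. dim_numbers = [b, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f], rather than only as the verbose dimension_numbers dictionary attribute. The round-trip tests further down exercise both the generic and the custom form.
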
@@ -21,10 +21,24 @@ limitations under the License.
#include "mlir/IR/BuiltinAttributes.h"
#include "mlir/IR/BuiltinTypes.h"
#include "mlir/IR/Identifier.h"
#include "mlir/IR/OpDefinition.h"
#include "mlir/IR/OpImplementation.h"
#include "mlir/IR/Types.h"

// Order matters, this .inc header is not self-contained, and relies on the
// #includes above.
#include "mlir-hlo/Dialect/mhlo/IR/hlo_ops_base_structs.h.inc"

namespace mlir {
namespace mhlo {

// Custom printer and parser for struct attributes.
void printConvolutionDimensions(OpAsmPrinter &p, Operation *op,
                                ConvDimensionNumbers dnums);
ParseResult parseConvolutionDimensions(OpAsmParser &parser,
                                       ConvDimensionNumbers &dnums);

}  // namespace mhlo
}  // namespace mlir

#endif  // TENSORFLOW_COMPILER_MLIR_HLO_INCLUDE_MLIR_HLO_DIALECT_MHLO_IR_HLO_OPS_BASE_STRUCTS_H_

@@ -865,6 +865,12 @@ def LHLO_ConvOp : LHLO_Op<"convolution", []> {
        [](bool v) { return v; });
    }
  }];

  let assemblyFormat = [{
    `(`operands`)`
       `dim_numbers` `=` custom<ConvolutionDimensions>($dimension_numbers)
       attr-dict `:` functional-type(operands, results)
  }];
}

def LHLO_CopyOp: LHLO_Op<"copy", [CopyOpInterface]> {

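For context (this is standard MLIR declarative-assembly behavior, not something introduced by this diff): a custom<ConvolutionDimensions>(...) directive in the assemblyFormat is resolved to free functions named printConvolutionDimensions and parseConvolutionDimensions with the signatures declared in the header hunk above, which is why those declarations and the definitions in the next hunk accompany this TableGen change.
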
@@ -15,4 +15,209 @@ limitations under the License.

#include "mlir-hlo/Dialect/mhlo/IR/hlo_ops_base_structs.h"

#include <set>
#include <unordered_map>

#include "mlir-hlo/Dialect/mhlo/IR/hlo_ops_base_structs.cc.inc"
#include "mlir/IR/Builders.h"
#include "mlir/IR/BuiltinAttributes.h"

namespace mlir {
namespace mhlo {

namespace {
enum NonSpatialDim : int64_t {
  IOBatch = -1,    // Input or output batch dimension.
  IOFeature = -2,  // Input or output feature dimension.
  KIFeature = -3,  // Kernel input feature dimension.
  KOFeature = -4,  // Kernel output feature dimension.
};

char NonSpatialDimToString(NonSpatialDim dim) {
  switch (dim) {
    case IOBatch:
      return 'b';
    case IOFeature:
      return 'f';
    case KIFeature:
      return 'i';
    case KOFeature:
      return 'o';
  }
}
}  // namespace

// Custom printer and parser for struct attributes.
void printConvolutionDimensions(OpAsmPrinter &p, Operation * /*op*/,
                                ConvDimensionNumbers dnums) {
  auto print_dim =
      [&p](DenseIntElementsAttr spatial_dims,
           ArrayRef<std::pair<IntegerAttr, NonSpatialDim>> non_spatial_dims) {
        llvm::SmallVector<int64_t> dims(non_spatial_dims.size() +
                                        spatial_dims.size());
        // Fill each element of dims with a (< 0) NonSpatialDim enum or a
        // (>= 0) spatial dimension index.
        for (const std::pair<IntegerAttr, NonSpatialDim> &non_spatial_dim :
             non_spatial_dims) {
          dims[non_spatial_dim.first.getInt()] = non_spatial_dim.second;
        }
        for (auto spatial_dim :
             llvm::enumerate(spatial_dims.getValues<int64_t>())) {
          dims[spatial_dim.value()] = static_cast<int64_t>(spatial_dim.index());
        }

        // The dimension numbers are printed as a comma-separated list
        // surrounded by square brackets, e.g., [b, 0, 1, 2, f].
        p << '[';
        llvm::interleaveComma(dims, p, [&](int64_t dim) {
          if (dim >= 0) {
            p << dim;
          } else {
            p << NonSpatialDimToString(static_cast<NonSpatialDim>(dim));
          }
        });
        p << ']';
      };

  print_dim(dnums.input_spatial_dimensions(),
            {{dnums.input_batch_dimension(), IOBatch},
             {dnums.input_feature_dimension(), IOFeature}});
  p << "x";
  print_dim(dnums.kernel_spatial_dimensions(),
            {{dnums.kernel_input_feature_dimension(), KIFeature},
             {dnums.kernel_output_feature_dimension(), KOFeature}});
  p << "->";
  print_dim(dnums.output_spatial_dimensions(),
            {{dnums.output_batch_dimension(), IOBatch},
             {dnums.output_feature_dimension(), IOFeature}});
}

ParseResult parseConvolutionDimensions(OpAsmParser &parser,
                                       ConvDimensionNumbers &dnums) {
  // Parsing a single set of dim numbers gives the spatial dimensions as a
  // single DenseIntElementsAttr and a list of non-spatial dimensions as
  // IntegerAttrs (indexed by the NonSpatialDim enum).
  using parse_dim_result_t = std::pair<
      DenseIntElementsAttr,
      std::unordered_map<NonSpatialDim, IntegerAttr, std::hash<int64_t>>>;

  // Note that allowed_non_spatial_dims is an ordered set (as opposed to an
  // unordered set) because it is used to print the list of allowed non-spatial
  // dims in error messages, and keeping it ordered keeps those messages
  // deterministic.
  auto parse_dims =
      [&](std::set<NonSpatialDim, std::greater<>> allowed_non_spatial_dims,
          parse_dim_result_t &parsed_dims) -> ParseResult {
    // Parse the starting [.
    if (parser.parseLSquare()) {
      return failure();
    }
    llvm::SmallVector<int64_t> spatial_dims;
    std::unordered_map<NonSpatialDim, IntegerAttr, std::hash<int64_t>>
        non_spatial_dims;

    int64_t index = 0;
    do {
      int64_t spatial_dim;
      OptionalParseResult parseResult =
          parser.parseOptionalInteger(spatial_dim);
      if (parseResult.hasValue()) {
        if (parseResult.getValue().failed()) {
          return failure();
        }
        // Successfully parsed an integer: record the current position as a
        // spatial dimension.
        spatial_dims.push_back(index);
      } else {
        // We did not parse an integer. We expect a keyword token.
        StringRef keyword;
        if (parser.parseKeyword(&keyword)) {
          return failure();
        }
        if (keyword.size() != 1 || allowed_non_spatial_dims.empty()) {
          return parser.emitError(parser.getCurrentLocation(),
                                  "Unexpected keyword ")
                 << keyword;
        }
        // Check if the keyword matches one of the allowed non-spatial dims.
        // If so, add it to the non_spatial dims and remove it from the
        // allowed set so that it won't be allowed again.
        bool is_allowed = false;
        for (NonSpatialDim allowed : allowed_non_spatial_dims) {
          if (keyword[0] == NonSpatialDimToString(allowed)) {
            non_spatial_dims.insert(
                {allowed, parser.getBuilder().getI64IntegerAttr(index)});
            allowed_non_spatial_dims.erase(allowed);
            is_allowed = true;
            break;
          }
        }

        if (!is_allowed) {
          mlir::InFlightDiagnostic diag = parser.emitError(
              parser.getCurrentLocation(), "Unexpected dimension ");
          diag << keyword << ", expecting ";
          llvm::interleaveComma(
              allowed_non_spatial_dims, diag,
              [&](NonSpatialDim dim) { diag << NonSpatialDimToString(dim); });
          return diag;
        }
      }
      index++;
    } while (parser.parseOptionalComma().succeeded());

    // Make sure all expected non-spatial dimensions were parsed.
    if (!allowed_non_spatial_dims.empty()) {
      mlir::InFlightDiagnostic diag =
          parser.emitError(parser.getCurrentLocation(), "Expected dimensions ");
      llvm::interleaveComma(
          allowed_non_spatial_dims, diag,
          [&](NonSpatialDim dim) { diag << NonSpatialDimToString(dim); });
      diag << " not specified";
      return diag;
    }

    // Parse the ending ].
    if (parser.parseRSquare()) {
      return failure();
    }

    parsed_dims = std::make_pair(
        parser.getBuilder().getI64TensorAttr(spatial_dims), non_spatial_dims);
    return success();
  };

  parse_dim_result_t parsed_dims;
  if (parse_dims({IOBatch, IOFeature}, parsed_dims)) {
    return failure();
  }
  DenseIntElementsAttr input_spatial_dimensions = parsed_dims.first;
  IntegerAttr input_batch_dimension = parsed_dims.second[IOBatch];
  IntegerAttr input_feature_dimension = parsed_dims.second[IOFeature];
  if (parser.parseKeyword("x")) return failure();
  if (parse_dims({KIFeature, KOFeature}, parsed_dims)) {
    return failure();
  }
  DenseIntElementsAttr kernel_spatial_dimensions = parsed_dims.first;
  IntegerAttr kernel_input_feature_dimension = parsed_dims.second[KIFeature];
  IntegerAttr kernel_output_feature_dimension = parsed_dims.second[KOFeature];
  if (parser.parseArrow()) {
    return failure();
  }
  if (parse_dims({IOBatch, IOFeature}, parsed_dims)) {
    return failure();
  }
  DenseIntElementsAttr output_spatial_dimensions = parsed_dims.first;
  IntegerAttr output_batch_dimension = parsed_dims.second[IOBatch];
  IntegerAttr output_feature_dimension = parsed_dims.second[IOFeature];
  dnums = ConvDimensionNumbers::get(
      input_batch_dimension, input_feature_dimension, input_spatial_dimensions,
      kernel_input_feature_dimension, kernel_output_feature_dimension,
      kernel_spatial_dimensions, output_batch_dimension,
      output_feature_dimension, output_spatial_dimensions,
      parser.getBuilder().getContext());

  return success();
}

}  // namespace mhlo
}  // namespace mlir

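As a worked example of the printing scheme above, here is a standalone C++ sketch (not part of the commit; it mirrors the dims-array construction from printConvolutionDimensions using plain STL types in place of MLIR attributes). For an NHWC-style operand with batch dimension 0, feature dimension 3, and spatial dimensions [1, 2], the array becomes {IOBatch, 0, 1, IOFeature}, which prints as [b, 0, 1, f].

// Standalone illustration of the dims-array construction used by
// printConvolutionDimensions; attributes are replaced by plain integers.
#include <cstdint>
#include <iostream>
#include <string>
#include <utility>
#include <vector>

enum NonSpatialDim : int64_t { IOBatch = -1, IOFeature = -2 };

char NonSpatialDimToChar(NonSpatialDim dim) {
  return dim == IOBatch ? 'b' : 'f';
}

// Returns e.g. "[b, 0, 1, f]" for batch at dim 0, feature at dim 3, and
// spatial dims at positions 1 and 2.
std::string PrintDims(
    const std::vector<int64_t> &spatial_dims,
    const std::vector<std::pair<int64_t, NonSpatialDim>> &non_spatial_dims) {
  std::vector<int64_t> dims(spatial_dims.size() + non_spatial_dims.size());
  // Non-spatial dims: the stored value is the dimension's position, so it
  // indexes into `dims`; the enum marks what kind of dimension sits there.
  for (const auto &non_spatial_dim : non_spatial_dims) {
    dims[non_spatial_dim.first] = non_spatial_dim.second;
  }
  // Spatial dims: entry i of spatial_dims holds the position of the i-th
  // spatial dimension, so that position receives the index i.
  for (size_t i = 0; i < spatial_dims.size(); ++i) {
    dims[spatial_dims[i]] = static_cast<int64_t>(i);
  }
  std::string out = "[";
  for (size_t i = 0; i < dims.size(); ++i) {
    if (i > 0) out += ", ";
    if (dims[i] >= 0) {
      out += std::to_string(dims[i]);
    } else {
      out += NonSpatialDimToChar(static_cast<NonSpatialDim>(dims[i]));
    }
  }
  return out + "]";
}

int main() {
  // NHWC input: batch at dim 0, feature at dim 3, spatial dims at 1 and 2.
  std::cout << PrintDims({1, 2}, {{0, IOBatch}, {3, IOFeature}}) << "\n";
  // Prints: [b, 0, 1, f]
}
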
@@ -518,7 +518,7 @@ func @conv(%input: tensor<3x5x5x3xf32>, %filter : tensor<2x2x3x4xf32>)
                  -> tensor<3x5x5x4xf32> {
  %c0 = constant 0 : index
  // CHECK: %[[OUT:.*]] = memref.alloc() : memref<3x5x5x4xf32>
  // CHECK: "lmhlo.convolution"(%{{.+}}, %{{.+}}, %[[OUT]])
  // CHECK: lmhlo.convolution(%{{.+}}, %{{.+}}, %[[OUT]])
  // CHECK-SAME: padding = dense<[
  // CHECK-SAME: [0, 1], [0, 1]]> : tensor<2x2xi64>
  // CHECK-SAME: rhs_dilation = dense<[1, 2]>

@@ -171,6 +171,128 @@ func @convert_memref(%in: memref<10xf32>, %out: memref<9xi32>) -> () {

// -----

// CHECK-LABEL: func @convolution
// CHECK: lmhlo.convolution
// CHECK-SAME: dim_numbers = [b, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f]
func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  "lmhlo.convolution"(%arg0, %arg1, %arg2) {batch_group_count = 1 : i64,
      dimension_numbers = {input_batch_dimension = 0 : i64,
                           input_feature_dimension = 3 : i64,
                           input_spatial_dimensions = dense<[1, 2]> : tensor<2xi64>,
                           kernel_input_feature_dimension = 2 : i64,
                           kernel_output_feature_dimension = 3 : i64,
                           kernel_spatial_dimensions = dense<[0, 1]> : tensor<2xi64>,
                           output_batch_dimension = 0 : i64,
                           output_feature_dimension = 3 : i64,
                           output_spatial_dimensions = dense<[1, 2]> : tensor<2xi64>},
      feature_group_count = 1 : i64,
      padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
      rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
      window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

// CHECK-LABEL: func @convolution
// CHECK: lmhlo.convolution
// CHECK-SAME: dim_numbers = [b, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f]
func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [b, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{Unexpected dimension c, expecting b, f}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [c, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{Unexpected dimension b, expecting i, o}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [b, 0, 1, f]x[0, 1, b, o]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{Unexpected dimension i, expecting o}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [b, 0, 1, f]x[0, 1, i, i]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{Expected dimensions f not specified}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [b, 0, 1]x[0, 1, i, o]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{Unexpected keyword b}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = [b, 0, 1, f]x[0, 1, i, o, b]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----

func @convolution(%arg0: memref<2x2x3x4xf32>, %arg1: memref<3x5x5x3xf32>, %arg2: memref<3x5x5x4xf32>) {
  // expected-error@+2{{expected '['}}
  lmhlo.convolution(%arg0, %arg1, %arg2)
      dim_numbers = {b, 0, 1, f]x[0, 1, i, o]->[b, 0, 1, f]
      { batch_group_count = 1 : i64, feature_group_count = 1 : i64,
        padding = dense<[[0, 1], [0, 1]]> : tensor<2x2xi64>,
        rhs_dilation = dense<[1, 2]> : tensor<2xi64>,
        window_strides = dense<[2, 1]> : tensor<2xi64>}
    : (memref<2x2x3x4xf32>, memref<3x5x5x3xf32>, memref<3x5x5x4xf32>) -> ()
  return
}

// -----
// CHECK-LABEL: func @exp
func @exp(%input: memref<2x2xf32>, %result: memref<2x2xf32>) {
  "lmhlo.exponential"(%input, %result) : (memref<2x2xf32>, memref<2x2xf32>) -> ()