mlir-hlo/lib/Dialect/mhlo/transforms/lhlo_legalize_to_gpu.cc

/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

    http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/

// This file implements logic for lowering LHLO dialect to GPU dialect.

#include <cstdint>

#include "llvm/ADT/ArrayRef.h"
#include "mlir-hlo/Dialect/mhlo/IR/lhlo_ops.h"
#include "mlir-hlo/Dialect/mhlo/transforms/PassDetail.h"
#include "mlir-hlo/Dialect/mhlo/transforms/map_lmhlo_to_scalar_op.h"
#include "mlir/Dialect/Affine/IR/AffineOps.h"
#include "mlir/Dialect/GPU/GPUDialect.h"
#include "mlir/Dialect/Linalg/IR/LinalgOps.h"
#include "mlir/Dialect/Linalg/IR/LinalgTypes.h"
#include "mlir/Dialect/MemRef/IR/MemRef.h"
#include "mlir/Dialect/SCF/SCF.h"
#include "mlir/Dialect/StandardOps/IR/Ops.h"
#include "mlir/IR/Attributes.h"
#include "mlir/IR/BlockAndValueMapping.h"
#include "mlir/IR/Builders.h"
#include "mlir/IR/BuiltinOps.h"
#include "mlir/IR/BuiltinTypes.h"
#include "mlir/IR/Location.h"
#include "mlir/IR/MLIRContext.h"
#include "mlir/IR/Operation.h"
#include "mlir/IR/PatternMatch.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Transforms/DialectConversion.h"

namespace mlir {
namespace lmhlo {
namespace {

// A simple translation of LHLO reduce operations to a corresponding gpu
// launch operation. The transformation does no tiling and also only supports
// 1d results.
//
// The emitted IR has the following structure:
//   gpu.launch with a 1x1x1 grid and a <result size>x1x1 block {
//     store every init value to its output at [thread_id.x]
//     scf.for %i = 0 to <size of the reduced input dimension> step 1 {
//       %acc = memref.subview of the first output at [thread_id.x]
//       %rhs = memref.subview of the first input, indexed by %i in the
//              reduced dimension and by thread_id.x in every other dimension
//       <clone of the reduction body with (%acc, %rhs, %acc) as arguments>
//     }
//     gpu.terminator
//   }
//
// The pattern fails to match (without modifying the IR) when:
//   * the reduction body does not take exactly three block arguments,
//   * no reduction dimension is given,
//   * an output is not a statically shaped rank-1 value, or the outputs
//     disagree on their size,
//   * an input is not statically shaped or the reduction dimension is out of
//     range for it.
class LhloReduceToGPULaunchConverter : public OpConversionPattern<ReduceOp> {
 public:
  using OpConversionPattern::OpConversionPattern;

  // Rewrites `reduce_op` into a gpu.launch as described on the class.
  // `args` (the remapped operands) is not used; the original operands of
  // `reduce_op` are referenced directly.
  LogicalResult matchAndRewrite(
      ReduceOp reduce_op, ArrayRef<Value> args,
      ConversionPatternRewriter& rewriter) const final {
    auto loc = reduce_op.getLoc();

    // The cloned body below is wired up through exactly three block arguments
    // (accumulator, value to reduce, result). Any other arity would leave
    // block arguments unmapped in the cloned operations.
    if (reduce_op.body().getNumArguments() != 3) {
      return failure();
    }

    // Only the first reduction dimension is considered; make sure it exists
    // before dereferencing the iterator.
    auto dimensions = reduce_op.dimensions();
    if (dimensions.getNumElements() == 0) {
      return failure();
    }
    const int64_t reducing_dimension =
        (*dimensions.int_value_begin()).getSExtValue();

    // Only support 1d reductions for now. The result size becomes a constant
    // block size, so it has to be known statically.
    int64_t size = 0;
    for (auto result : reduce_op.out()) {
      auto shaped_type = result.getType().dyn_cast<ShapedType>();
      if (!shaped_type || !shaped_type.hasStaticShape() ||
          shaped_type.getRank() != 1) {
        return failure();
      }
      auto dim_size = shaped_type.getDimSize(0);
      if (size && size != dim_size) {
        return failure();
      }
      size = dim_size;
    }

    // Require all inputs to be statically shaped and to actually have the
    // reduced dimension. The trip count of the loop is taken from it.
    int64_t reduce_dim_size = 0;
    for (auto input : reduce_op.inputs()) {
      auto shaped_type = input.getType().dyn_cast<ShapedType>();
      if (!shaped_type || !shaped_type.hasStaticShape()) {
        return failure();
      }
      if (reducing_dimension < 0 ||
          reducing_dimension >= shaped_type.getRank()) {
        return failure();
      }
      reduce_dim_size = shaped_type.getDimSize(reducing_dimension);
    }

    // Create a launch that is parallel in the result dimension.
    auto block_size_x = rewriter.create<mlir::ConstantOp>(
        loc, rewriter.getIndexType(),
        rewriter.getIntegerAttr(rewriter.getIndexType(), size));
    auto one = rewriter.create<mlir::ConstantOp>(
        loc, rewriter.getIndexType(),
        rewriter.getIntegerAttr(rewriter.getIndexType(), 1));
    auto launch_op = rewriter.create<mlir::gpu::LaunchOp>(
        loc, one, one, one, block_size_x, one, one);
    {
      // Restore the insertion point once the launch body has been populated.
      OpBuilder::InsertionGuard guard(rewriter);
      rewriter.setInsertionPointToEnd(&launch_op.body().front());
      auto index = launch_op.getThreadIds().x;

      // Load the initial value and store it to the output.
      for (auto pair : llvm::zip(reduce_op.init_values(), reduce_op.out())) {
        auto init_value =
            rewriter.create<mlir::memref::LoadOp>(loc, std::get<0>(pair));
        rewriter.create<mlir::memref::StoreOp>(
            loc, init_value, std::get<1>(pair), ArrayRef<Value>{index});
      }

      // Insert a loop into the body to compute the reduction. The loop ranges
      // from [0, dim).
      auto zero = rewriter.create<mlir::ConstantOp>(
          loc, rewriter.getIndexType(),
          rewriter.getIntegerAttr(rewriter.getIndexType(), 0));
      // TODO(b/137624192) Use dimOp to make it shape independent.
      auto upper = rewriter.create<mlir::ConstantOp>(
          loc, rewriter.getIndexType(),
          rewriter.getIntegerAttr(rewriter.getIndexType(), reduce_dim_size));
      auto step = rewriter.create<mlir::ConstantOp>(
          loc, rewriter.getIndexType(),
          rewriter.getIntegerAttr(rewriter.getIndexType(), 1));
      auto loop = rewriter.create<mlir::scf::ForOp>(loc, zero, upper, step);

      rewriter.setInsertionPointToStart(loop.getBody());
      // Compute memrefs for the value to reduce. This makes it easier to just
      // inline the body.
      auto output = *reduce_op.out().begin();
      // Rank-0 memref with a dynamic offset: a view of a single element.
      auto resType = MemRefType::get(
          llvm::None, getElementTypeOrSelf(output.getType()),
          makeStridedLinearLayoutMap(llvm::None,
                                     MemRefType::getDynamicStrideOrOffset(),
                                     rewriter.getContext()));
      OpFoldResult offset = launch_op.getThreadIds().x;
      auto oneAttr = rewriter.getI64IntegerAttr(1);
      OpFoldResult unit_size = oneAttr;
      OpFoldResult unit_stride = oneAttr;
      auto accumulator = rewriter.create<memref::SubViewOp>(
          loc, resType, output, offset, unit_size, unit_stride);

      Value input = reduce_op.inputs().front();
      auto input_type_rank = input.getType().cast<MemRefType>().getRank();

      // The loop induction variable walks the reduced dimension; every other
      // dimension is indexed by the thread id.
      SmallVector<OpFoldResult> offsets = llvm::to_vector<4>(llvm::map_range(
          llvm::seq<int>(0, input_type_rank), [&](int dim) -> OpFoldResult {
            return dim == reducing_dimension ? loop.getInductionVar()
                                             : launch_op.getThreadIds().x;
          }));
      SmallVector<OpFoldResult> sizes(input_type_rank, oneAttr);
      SmallVector<OpFoldResult> strides(input_type_rank, oneAttr);
      auto rhs = rewriter.create<memref::SubViewOp>(
          loc, accumulator.getType(), input, offsets, sizes, strides);

      // Now copy over the actual body of the reduction, leaving out the
      // terminator. The accumulator serves as both the left-hand side and
      // the destination of the cloned computation.
      BlockAndValueMapping mapping;
      mapping.map(reduce_op.body().getArgument(0), accumulator);
      mapping.map(reduce_op.body().getArgument(1), rhs);
      mapping.map(reduce_op.body().getArgument(2), accumulator);
      for (auto& nested : reduce_op.body().front().without_terminator()) {
        auto clone = rewriter.clone(nested, mapping);
        // Make results of the clone visible to subsequently cloned users.
        for (auto pair : llvm::zip(nested.getResults(), clone->getResults())) {
          mapping.map(std::get<0>(pair), std::get<1>(pair));
        }
      }

      // Finally, insert the terminator for the launchOp.
      rewriter.setInsertionPointToEnd(&launch_op.body().front());
      rewriter.create<mlir::gpu::TerminatorOp>(loc);
    }

    rewriter.eraseOp(reduce_op);
    return success();
  }
};

// Function pass that rewrites every lmhlo ReduceOp in the function with
// LhloReduceToGPULaunchConverter. All other operations are left untouched.
struct LhloLegalizeToGpuPass
    : public LhloLegalizeToGpuPassBase<LhloLegalizeToGpuPass> {
  // Registers the dialects whose operations may be created while the pass
  // runs. The standard dialect is included because the conversion pattern
  // materializes index constants with mlir::ConstantOp.
  void getDependentDialects(DialectRegistry& registry) const override {
    registry.insert<AffineDialect, gpu::GPUDialect, linalg::LinalgDialect,
                    memref::MemRefDialect, scf::SCFDialect,
                    StandardOpsDialect>();
  }

  // Runs a partial conversion over the current function. ReduceOp is the only
  // operation marked illegal; the remaining LMHLO operations stay legal
  // through the LmhloDialect entry. The pass is signalled as failed when a
  // ReduceOp cannot be converted.
  void runOnFunction() override {
    OwningRewritePatternList patterns(&getContext());
    ConversionTarget target(getContext());
    target.addLegalDialect<linalg::LinalgDialect, memref::MemRefDialect,
                           StandardOpsDialect, gpu::GPUDialect, scf::SCFDialect,
                           LmhloDialect>();
    target.addIllegalOp<ReduceOp>();
    auto func = getFunction();
    patterns.insert<LhloReduceToGPULaunchConverter>(func.getContext());
    if (failed(applyPartialConversion(func, target, std::move(patterns)))) {
      signalPassFailure();
    }
  }
};

}  // namespace

// Factory for the LHLO-to-GPU legalization pass; the caller owns the
// returned pass instance.
std::unique_ptr<FunctionPass> createLegalizeToGpuPass() {
  std::unique_ptr<FunctionPass> legalize_pass =
      std::make_unique<LhloLegalizeToGpuPass>();
  return legalize_pass;
}

}  // namespace lmhlo
}  // namespace mlir
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.`

			`Licensed under the Apache License, Version 2.0 (the "License");`
			`you may not use this file except in compliance with the License.`
			`You may obtain a copy of the License at`

			`http://www.apache.org/licenses/LICENSE-2.0`

			`Unless required by applicable law or agreed to in writing, software`
			`distributed under the License is distributed on an "AS IS" BASIS,`
			`WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`See the License for the specific language governing permissions and`
			`limitations under the License.`
			`==============================================================================*/`

			`// This file implements logic for lowering LHLO dialect to GPU dialect.`

			`#include <cstdint>`

More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`#include "llvm/ADT/ArrayRef.h"`
			`#include "mlir-hlo/Dialect/mhlo/IR/lhlo_ops.h"`
Fix pass definition to inherit from the TableGen generated base class (NFC) PiperOrigin-RevId: 379860210 2021-06-17 10:04:23 +08:00			`#include "mlir-hlo/Dialect/mhlo/transforms/PassDetail.h"`
More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`#include "mlir-hlo/Dialect/mhlo/transforms/map_lmhlo_to_scalar_op.h"`
Remove the dependency on global dialect registry from mlir-hlo PiperOrigin-RevId: 328457105 2020-08-26 11:30:05 +08:00			`#include "mlir/Dialect/Affine/IR/AffineOps.h"`
More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`#include "mlir/Dialect/GPU/GPUDialect.h"`
			`#include "mlir/Dialect/Linalg/IR/LinalgOps.h"`
Remove the dependency on global dialect registry from mlir-hlo PiperOrigin-RevId: 328457105 2020-08-26 11:30:05 +08:00			`#include "mlir/Dialect/Linalg/IR/LinalgTypes.h"`
mlir-hlo-opt: set preloadDialectsInContext to false. This requires specifying dependent dialects in several passes. PiperOrigin-RevId: 365758084 2021-03-30 16:06:12 +08:00			`#include "mlir/Dialect/MemRef/IR/MemRef.h"`
More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`#include "mlir/Dialect/SCF/SCF.h"`
			`#include "mlir/Dialect/StandardOps/IR/Ops.h"`
			`#include "mlir/IR/Attributes.h"`
			`#include "mlir/IR/BlockAndValueMapping.h"`
			`#include "mlir/IR/Builders.h"`
[mlir][NFC] Replace usages of Function.h and Module.h with BuiltinOps.h This is part of a larger refactoring cleaning up the BuiltinDialect of MLIR. PiperOrigin-RevId: 345085278 2020-12-02 05:17:12 +08:00			`#include "mlir/IR/BuiltinOps.h"`
[mlir][NFC] Replace usages or mlir/IR/StandardTypes.h with mlir/IR/BuiltinTypes.h StandardTypes.h was moved to BuiltinTypes.h and is being removed. PiperOrigin-RevId: 347559927 2020-12-15 16:58:42 +08:00			`#include "mlir/IR/BuiltinTypes.h"`
More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`#include "mlir/IR/Location.h"`
			`#include "mlir/IR/MLIRContext.h"`
			`#include "mlir/IR/Operation.h"`
			`#include "mlir/IR/PatternMatch.h"`
			`#include "mlir/Pass/Pass.h"`
			`#include "mlir/Transforms/DialectConversion.h"`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00
			`namespace mlir {`
Rename xla_lhlo dialect into lmhlo Following on the plan of isolating the compiler/mlir/hlo directory. Another xla_lhlo dialect will be created under compiler/mlir/xla/ later. PiperOrigin-RevId: 320210326 2020-07-09 01:05:32 +08:00			`namespace lmhlo {`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`namespace {`

			`// A simple translation of LHLO reduce operations to a corresponding gpu`
			`// launch operation. The transformation does no tiling and also only supports`
			`// 1d results.`
			`class LhloReduceToGPULaunchConverter : public OpConversionPattern<ReduceOp> {`
			`public:`
			`using OpConversionPattern::OpConversionPattern;`

			`LogicalResult matchAndRewrite(`
			`ReduceOp reduce_op, ArrayRef<Value> args,`
			`ConversionPatternRewriter& rewriter) const final {`
			`auto loc = reduce_op.getLoc();`
			`// Only support 1d reductions for now.`
			`int64_t size = 0;`
			`for (auto result : reduce_op.out()) {`
			`auto shaped_type = result.getType().dyn_cast<ShapedType>();`
			`if (!shaped_type \|\| shaped_type.getRank() != 1) {`
			`return failure();`
			`}`
			`auto dim_size = shaped_type.getDimSize(0);`
			`if (size && size != dim_size) {`
			`return failure();`
			`}`
			`size = dim_size;`
			`}`

			`auto reducing_dimension = *reduce_op.dimensions().int_value_begin();`

			`// Require all inputs to have the same shape.`
			`int64_t reduce_dim_size = 0;`
[MLIR][NFC] Rename ReduceOp operands() => inputs(). - Rename to avoid confusion as operands generally includes all operands of an operation PiperOrigin-RevId: 368479524 2021-04-15 03:05:33 +08:00			`for (auto input : reduce_op.inputs()) {`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`auto shaped_type = input.getType().dyn_cast<ShapedType>();`
			`if (!shaped_type \|\| !shaped_type.hasStaticShape()) {`
			`return failure();`
			`}`
			`reduce_dim_size =`
			`shaped_type.getDimSize(reducing_dimension.getSExtValue());`
			`}`

			`// Create a launch that is parallel in the result dimension.`
			`auto block_size_x = rewriter.create<mlir::ConstantOp>(`
			`loc, rewriter.getIndexType(),`
			`rewriter.getIntegerAttr(rewriter.getIndexType(), size));`
			`auto one = rewriter.create<mlir::ConstantOp>(`
			`loc, rewriter.getIndexType(),`
			`rewriter.getIntegerAttr(rewriter.getIndexType(), 1));`
			`auto launch_op = rewriter.create<mlir::gpu::LaunchOp>(`
			`loc, one, one, one, block_size_x, one, one);`
			`{`
			`OpBuilder::InsertionGuard guard(rewriter);`
			`rewriter.setInsertionPointToEnd(&launch_op.body().front());`
			`auto index = launch_op.getThreadIds().x;`

			`// Load the initial value and store it to the output.`
			`for (auto pair : llvm::zip(reduce_op.init_values(), reduce_op.out())) {`
Integrate LLVM at llvm/llvm-project@678241795c95 Updates LLVM usage to match [678241795c95](https://github.com/llvm/llvm-project/commit/678241795c95) PiperOrigin-RevId: 363257913 2021-03-17 04:31:59 +08:00			`auto init_value =`
			`rewriter.create<mlir::memref::LoadOp>(loc, std::get<0>(pair));`
			`rewriter.create<mlir::memref::StoreOp>(`
			`loc, init_value, std::get<1>(pair), ArrayRef<Value>{index});`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`}`

			`// Insert a loop into the body to compute the reduction. The loop ranges`
			`// from [0.dim).`
			`auto zero = rewriter.create<mlir::ConstantOp>(`
			`loc, rewriter.getIndexType(),`
			`rewriter.getIntegerAttr(rewriter.getIndexType(), 0));`
			`// TODO(b/137624192) Use dimOp to make it shape independent.`
			`auto upper = rewriter.create<mlir::ConstantOp>(`
			`loc, rewriter.getIndexType(),`
			`rewriter.getIntegerAttr(rewriter.getIndexType(), reduce_dim_size));`
			`auto step = rewriter.create<mlir::ConstantOp>(`
			`loc, rewriter.getIndexType(),`
			`rewriter.getIntegerAttr(rewriter.getIndexType(), 1));`
			`auto loop = rewriter.create<mlir::scf::ForOp>(loc, zero, upper, step);`

			`rewriter.setInsertionPointToStart(loop.getBody());`
			`// Compute memrefs for the value to reduce. This makes it easier to just`
			`// inline the body.`
			`auto output = *reduce_op.out().begin();`
			`auto resType = MemRefType::get(`
Integrate LLVM at llvm/llvm-project@91e7a1713332 Updates LLVM usage to match [91e7a1713332](https://github.com/llvm/llvm-project/commit/91e7a1713332) PiperOrigin-RevId: 355702100 2021-02-05 05:41:18 +08:00			`llvm::None, getElementTypeOrSelf(output.getType()),`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`makeStridedLinearLayoutMap(llvm::None,`
			`MemRefType::getDynamicStrideOrOffset(),`
			`rewriter.getContext()));`
Integrate LLVM at llvm/llvm-project@91e7a1713332 Updates LLVM usage to match [91e7a1713332](https://github.com/llvm/llvm-project/commit/91e7a1713332) PiperOrigin-RevId: 355702100 2021-02-05 05:41:18 +08:00			`OpFoldResult offset = launch_op.getThreadIds().x;`
			`auto oneAttr = rewriter.getI64IntegerAttr(1);`
			`OpFoldResult size = oneAttr;`
			`OpFoldResult stride = oneAttr;`
Integrate LLVM at llvm/llvm-project@678241795c95 Updates LLVM usage to match [678241795c95](https://github.com/llvm/llvm-project/commit/678241795c95) PiperOrigin-RevId: 363257913 2021-03-17 04:31:59 +08:00			`auto accumulator = rewriter.create<memref::SubViewOp>(`
			`loc, resType, output, offset, size, stride);`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`llvm::SmallVector<Value, 4> indexings;`
[MLIR][NFC] Rename ReduceOp operands() => inputs(). - Rename to avoid confusion as operands generally includes all operands of an operation PiperOrigin-RevId: 368479524 2021-04-15 03:05:33 +08:00			`Value input_buffer = reduce_op.inputs().front();`
Integrate LLVM at llvm/llvm-project@91e7a1713332 Updates LLVM usage to match [91e7a1713332](https://github.com/llvm/llvm-project/commit/91e7a1713332) PiperOrigin-RevId: 355702100 2021-02-05 05:41:18 +08:00			`auto input_type_rank =`
			`input_buffer.getType().cast<MemRefType>().getRank();`

			`Value input = *reduce_op.operand_begin();`
			`SmallVector<OpFoldResult> offsets = llvm::to_vector<4>(llvm::map_range(`
			`llvm::seq<int>(0, input_type_rank), [&](int dim) -> OpFoldResult {`
			`return dim == reducing_dimension ? loop.getInductionVar()`
			`: launch_op.getThreadIds().x;`
			`}));`
			`SmallVector<OpFoldResult> sizes(input_type_rank, oneAttr);`
			`SmallVector<OpFoldResult> strides(input_type_rank, oneAttr);`
Integrate LLVM at llvm/llvm-project@678241795c95 Updates LLVM usage to match [678241795c95](https://github.com/llvm/llvm-project/commit/678241795c95) PiperOrigin-RevId: 363257913 2021-03-17 04:31:59 +08:00			`auto rhs = rewriter.create<memref::SubViewOp>(`
			`loc, accumulator.getType(), input, offsets, sizes, strides);`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00
			`// Now copy over the actual body of the reduction, leaving out the`
			`// terminator.`
			`BlockAndValueMapping mapping;`
[MLIR][NFC] Adopt FuncOp/Region argument API's. - Use FuncOp::getArguments() and Region::getArguments() and friends where possible instead of going through the front() block. PiperOrigin-RevId: 325352975 2020-08-07 09:31:33 +08:00			`mapping.map(reduce_op.body().getArgument(0), accumulator);`
			`mapping.map(reduce_op.body().getArgument(1), rhs);`
			`mapping.map(reduce_op.body().getArgument(2), accumulator);`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`for (auto& nested : reduce_op.body().front().without_terminator()) {`
			`auto clone = rewriter.clone(nested, mapping);`
			`for (auto pair : llvm::zip(nested.getResults(), clone->getResults())) {`
			`mapping.map(std::get<0>(pair), std::get<1>(pair));`
			`}`
			`}`

			`// Finally, insert the terminator for the launchOp.`
			`rewriter.setInsertionPointToEnd(&launch_op.body().front());`
			`rewriter.create<mlir::gpu::TerminatorOp>(loc);`
			`}`

			`rewriter.eraseOp(reduce_op);`
			`return success();`
			`};`
			`};`

More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`struct LhloLegalizeToGpuPass`
Fix pass definition to inherit from the TableGen generated base class (NFC) PiperOrigin-RevId: 379860210 2021-06-17 10:04:23 +08:00			`: public LhloLegalizeToGpuPassBase<LhloLegalizeToGpuPass> {`
Remove the dependency on global dialect registry from mlir-hlo PiperOrigin-RevId: 328457105 2020-08-26 11:30:05 +08:00			`void getDependentDialects(DialectRegistry& registry) const override {`
			`registry.insert<AffineDialect, gpu::GPUDialect, linalg::LinalgDialect,`
mlir-hlo-opt: set preloadDialectsInContext to false. This requires specifying dependent dialects in several passes. PiperOrigin-RevId: 365758084 2021-03-30 16:06:12 +08:00			`memref::MemRefDialect, scf::SCFDialect>();`
Remove the dependency on global dialect registry from mlir-hlo PiperOrigin-RevId: 328457105 2020-08-26 11:30:05 +08:00			`}`

Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`void runOnFunction() override {`
Integrate LLVM at llvm/llvm-project@b24436ac96bd Updates LLVM usage to match [b24436ac96bd](https://github.com/llvm/llvm-project/commit/b24436ac96bd) PiperOrigin-RevId: 364615807 2021-03-24 03:18:57 +08:00			`OwningRewritePatternList patterns(&getContext());`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`ConversionTarget target(getContext());`
Integrate LLVM at llvm/llvm-project@678241795c95 Updates LLVM usage to match [678241795c95](https://github.com/llvm/llvm-project/commit/678241795c95) PiperOrigin-RevId: 363257913 2021-03-17 04:31:59 +08:00			`target.addLegalDialect<linalg::LinalgDialect, memref::MemRefDialect,`
			`StandardOpsDialect, gpu::GPUDialect, scf::SCFDialect,`
			`LmhloDialect>();`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`target.addIllegalOp<ReduceOp>();`
			`auto func = getFunction();`
			`patterns.insert<LhloReduceToGPULaunchConverter>(func.getContext());`
Integrate LLVM at llvm/llvm-project@0fc1aa22ee6a Updates LLVM usage to match [0fc1aa22ee6a](https://github.com/llvm/llvm-project/commit/0fc1aa22ee6a) PiperOrigin-RevId: 339239851 2020-10-27 21:55:28 +08:00			`if (failed(applyPartialConversion(func, target, std::move(patterns)))) {`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`signalPassFailure();`
			`}`
			`}`
			`};`

			`} // namespace`

More cleanup in mlir-hlo to prepare for the standalone build Shuffle files around, use TableGen to register passes, and introduce a `mlir-hlo-opt.cpp` file to hold the main entry point of the -opt tool and stop relying on static registration for dialect/passes. PiperOrigin-RevId: 323674455 2020-07-29 07:12:08 +08:00			`std::unique_ptr<FunctionPass> createLegalizeToGpuPass() {`
			`return std::make_unique<LhloLegalizeToGpuPass>();`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`}`

Rename xla_lhlo dialect into lmhlo Following on the plan of isolating the compiler/mlir/hlo directory. Another xla_lhlo dialect will be created under compiler/mlir/xla/ later. PiperOrigin-RevId: 320210326 2020-07-09 01:05:32 +08:00			`} // namespace lmhlo`
Move XLA-independent transforms to the new MLIR-HLO directory This is as straighforward as possible, more cleanup/rewrite to come. PiperOrigin-RevId: 319849713 2020-07-07 04:57:00 +08:00			`} // namespace mlir`