onnx-mlir/src/Conversion/ONNXToKrnl/Tensor/Split.cpp


//===---------------- Split.cpp - Lowering Split Op -----------------------===//
//
// Copyright 2019 The IBM Research Authors.
//
// =============================================================================
//
// This file lowers the ONNX Split Operator to Krnl dialect.
//
//===----------------------------------------------------------------------===//

#include "src/Conversion/ONNXToKrnl/ONNXToKrnlCommon.hpp"

using namespace mlir;
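
// Lowers ONNXSplitOp: one buffer is allocated per output and, for each output,
// a Krnl loop nest copies the corresponding slice of the input into it,
// shifting the read index along the split axis by the output's offset.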
struct ONNXSplitOpLowering : public ConversionPattern {
  ONNXSplitOpLowering(MLIRContext *ctx)
      : ConversionPattern(mlir::ONNXSplitOp::getOperationName(), 1, ctx) {}

  LogicalResult matchAndRewrite(Operation *op, ArrayRef<Value> operands,
      ConversionPatternRewriter &rewriter) const final {
    // Gather info.
    auto loc = op->getLoc();
    ONNXSplitOp splitOp = llvm::dyn_cast<ONNXSplitOp>(op);
    auto axis = splitOp.axis().getSExtValue();
    auto split = splitOp.split().getValue();
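
    // Compute the start offset of each output along the split axis.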
    SmallVector<int64_t, 4> splitOffset;
    int64_t offset = 0;
    for (int i = 0; i < split.size(); ++i) {
      splitOffset.emplace_back(offset);
      offset += ArrayAttrIntVal(split, i);
    }
    auto rank = splitOp.input().getType().cast<ShapedType>().getRank();
    auto outputNum = splitOp.getNumResults();

    // Alloc and dealloc.
    SmallVector<Value, 4> allocs;
    for (int i = 0; i < outputNum; ++i) {
      Value alloc;
      bool insertDealloc = checkInsertDealloc(op, i);
      auto memRefType = convertToMemRefType(splitOp.outputs()[i].getType());
      if (hasAllConstantDimensions(memRefType))
        alloc = insertAllocAndDealloc(memRefType, loc, rewriter, insertDealloc);
      else {
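        // The output has dynamic dimensions: take every dynamic extent from
        // the input, except along the split axis, where the extent is this
        // output's static split size.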
        SmallVector<Value, 4> allocOperands;
        auto shape = memRefType.getShape();
        for (decltype(rank) r = 0; r < rank; ++r) {
          if (shape[r] < 0) {
            Value dim;
            if (r != axis)
              dim = rewriter.create<DimOp>(loc, operands[0], r);
            else
              dim = emitConstantOp(rewriter, loc, rewriter.getIndexType(),
                  ArrayAttrIntVal(split, i));
            allocOperands.push_back(dim);
          }
        }
        alloc = rewriter.create<AllocOp>(loc, memRefType, allocOperands);
        if (insertDealloc) {
          auto *parentBlock = alloc.getDefiningOp()->getBlock();
          auto dealloc = rewriter.create<DeallocOp>(loc, alloc);
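          // Keep the dealloc just before the terminator of the parent block.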
          dealloc.getOperation()->moveBefore(&parentBlock->back());
        }
      }
      allocs.emplace_back(alloc);
    }

    // Create the copy loops, one nest per output.
    for (int i = 0; i < outputNum; ++i) {
      OpBuilder::InsertionGuard insertGuard(rewriter);
      // Create loop.
      BuildKrnlLoop outputLoops(rewriter, loc, rank);
      outputLoops.createDefineAndIterateOp(allocs[i]);
      rewriter.setInsertionPointToStart(outputLoops.getIterateBlock());

      // Indices for the read and write.
      SmallVector<Value, 4> readIndices;
      SmallVector<Value, 4> writeIndices;
      for (int r = 0; r < rank; ++r) {
        // Read and write use the same index when this is:
        //   - the first output (its offset along the split axis is zero), or
        //   - any dimension other than the split axis.
        if (i == 0 || r != axis) {
          readIndices.emplace_back(outputLoops.getInductionVar(r));
        } else {
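          // Shift the read index along the split axis by this output's offset.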
          auto index = rewriter.getAffineDimExpr(0);
          auto indexMap = AffineMap::get(1, 0, index + splitOffset[i]);
          auto indexWithOffset = rewriter.create<AffineApplyOp>(loc, indexMap,
              ArrayRef<Value>{/*index=*/outputLoops.getInductionVar(r)});
          readIndices.emplace_back(indexWithOffset);
        }
        writeIndices.emplace_back(outputLoops.getInductionVar(r));
      }

      // Insert copy.
      auto loadData =
          rewriter.create<AffineLoadOp>(loc, operands[0], readIndices);
      rewriter.create<AffineStoreOp>(loc, loadData, allocs[i], writeIndices);
    }

    rewriter.replaceOp(op, allocs);
    return success();
  }
};
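
// Add the Split lowering pattern to the ONNX-to-Krnl pattern set.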
void populateLoweringONNXSplitOpPattern(
    OwningRewritePatternList &patterns, MLIRContext *ctx) {
  patterns.insert<ONNXSplitOpLowering>(ctx);
}