[MLIR] Fix shape inference and enable ONNF to read in MLIR files. (#367)
* Fix shape inference. * Enable ONNF to read in MLIR files. * Accept either ONNX or MLIR model files as input. * Address review comments.
This commit is contained in:
parent
0d644fab92
commit
dc36fd416b
|
@ -51,9 +51,14 @@ void ONNXAddOp::inferShapes() {
|
|||
// MatMul
|
||||
|
||||
void ONNXMatMulOp::inferShapes() {
|
||||
// Cannot infer shape if no shape exists.
|
||||
if (!getOperand(0)->getType().isa<RankedTensorType>() ||
|
||||
!getOperand(1)->getType().isa<RankedTensorType>())
|
||||
return;
|
||||
auto lhsTy = getOperand(0)->getType().cast<RankedTensorType>();
|
||||
auto rhsTy = getOperand(1)->getType().cast<RankedTensorType>();
|
||||
SmallVector<int64_t, 2> dims(lhsTy.getShape()[0]);
|
||||
SmallVector<int64_t, 2> dims;
|
||||
dims.emplace_back(lhsTy.getShape()[0]);
|
||||
dims.emplace_back(rhsTy.getShape()[1]);
|
||||
getResult()->setType(RankedTensorType::get(dims, lhsTy.getElementType()));
|
||||
}
|
||||
|
@ -67,9 +72,14 @@ void ONNXMatMulOp::inferShapes() {
|
|||
// Gemm
|
||||
|
||||
void ONNXGemmOp::inferShapes() {
|
||||
// Cannot infer shape if no shape exists.
|
||||
if (!getOperand(0)->getType().isa<RankedTensorType>() ||
|
||||
!getOperand(1)->getType().isa<RankedTensorType>())
|
||||
return;
|
||||
auto lhsTy = getOperand(0)->getType().cast<RankedTensorType>();
|
||||
auto rhsTy = getOperand(1)->getType().cast<RankedTensorType>();
|
||||
SmallVector<int64_t, 2> dims(lhsTy.getShape()[0]);
|
||||
SmallVector<int64_t, 2> dims;
|
||||
dims.emplace_back(lhsTy.getShape()[0]);
|
||||
dims.emplace_back(rhsTy.getShape()[1]);
|
||||
getResult()->setType(RankedTensorType::get(dims, lhsTy.getElementType()));
|
||||
}
|
||||
|
@ -77,9 +87,14 @@ void ONNXGemmOp::inferShapes() {
|
|||
// FullGemm
|
||||
|
||||
void ONNXFullGemmOp::inferShapes() {
|
||||
// Cannot infer shape if no shape exists.
|
||||
if (!getOperand(0)->getType().isa<RankedTensorType>() ||
|
||||
!getOperand(1)->getType().isa<RankedTensorType>())
|
||||
return;
|
||||
auto lhsTy = getOperand(0)->getType().cast<RankedTensorType>();
|
||||
auto rhsTy = getOperand(1)->getType().cast<RankedTensorType>();
|
||||
SmallVector<int64_t, 2> dims(lhsTy.getShape()[0]);
|
||||
SmallVector<int64_t, 2> dims;
|
||||
dims.emplace_back(lhsTy.getShape()[0]);
|
||||
dims.emplace_back(rhsTy.getShape()[1]);
|
||||
getResult()->setType(RankedTensorType::get(dims, lhsTy.getElementType()));
|
||||
}
|
||||
|
|
|
@ -13,8 +13,8 @@
|
|||
#include "llvm/Support/raw_ostream.h"
|
||||
#include "mlir/Pass/Pass.h"
|
||||
|
||||
#include "src/compiler/dialect/onnx/onnx_ops.hpp"
|
||||
#include "shape_inference_interface.hpp"
|
||||
#include "src/compiler/dialect/onnx/onnx_ops.hpp"
|
||||
|
||||
#include "passes.hpp"
|
||||
|
||||
|
@ -82,7 +82,10 @@ class ShapeInferencePass : public mlir::FunctionPass<ShapeInferencePass> {
|
|||
// All operations which do not return a ranked tensor type have dynamic
|
||||
// shaped outputs. All those operation need to implement the inferShape()
|
||||
// method.
|
||||
if (op->getName().getStringRef() != "onnx.add")
|
||||
if (op->getName().getStringRef() != "onnx.add" &&
|
||||
op->getName().getStringRef() != "onnx.matmul" &&
|
||||
op->getName().getStringRef() != "onnx.gemm" &&
|
||||
op->getName().getStringRef() != "onnx.full_gemm")
|
||||
return false;
|
||||
return llvm::any_of(op->getResultTypes(),
|
||||
[](Type result_type) { return !result_type.isa<RankedTensorType>(); });
|
||||
|
|
49
src/main.cpp
49
src/main.cpp
|
@ -28,6 +28,10 @@
|
|||
|
||||
#include <boost/program_options.hpp>
|
||||
|
||||
#include "llvm/Support/FileUtilities.h"
|
||||
#include "llvm/Support/Regex.h"
|
||||
#include "llvm/Support/SourceMgr.h"
|
||||
|
||||
#include "src/builder/frontend_dialect_transformer.hpp"
|
||||
#include "src/compiler/dialect/krnl/krnl_ops.hpp"
|
||||
#include "src/compiler/dialect/onnx/onnx_ops.hpp"
|
||||
|
@ -47,6 +51,28 @@
|
|||
using namespace std;
|
||||
using namespace onnf;
|
||||
|
||||
void LoadMLIR(string inputFilename, mlir::MLIRContext& context,
|
||||
mlir::OwningModuleRef& module) {
|
||||
// Handle '.mlir' input to the DLC compiler.
|
||||
// The mlir format indicates that one or more of the supported
|
||||
// representations are used in the file.
|
||||
llvm::ErrorOr<std::unique_ptr<llvm::MemoryBuffer>> fileOrErr =
|
||||
llvm::MemoryBuffer::getFileOrSTDIN(inputFilename);
|
||||
if (std::error_code EC = fileOrErr.getError()) {
|
||||
llvm::errs() << "Could not open input file: " << EC.message() << "\n";
|
||||
return;
|
||||
}
|
||||
|
||||
// Parse the input mlir.
|
||||
llvm::SourceMgr sourceMgr;
|
||||
sourceMgr.AddNewSourceBuffer(std::move(*fileOrErr), llvm::SMLoc());
|
||||
module = mlir::parseSourceFile(sourceMgr, &context);
|
||||
if (!module) {
|
||||
llvm::errs() << "Error can't load file " << inputFilename << "\n";
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
||||
int main(int ac, char* av[]) {
|
||||
namespace po = boost::program_options;
|
||||
|
||||
|
@ -57,8 +83,16 @@ int main(int ac, char* av[]) {
|
|||
"onnx model file");
|
||||
// clang-format on
|
||||
|
||||
// Handle command line argument with option names and positional
|
||||
// command line arguments.
|
||||
po::positional_options_description p;
|
||||
p.add("onnx-model", -1);
|
||||
po::variables_map vm;
|
||||
po::store(po::parse_command_line(ac, av, desc), vm);
|
||||
po::store(
|
||||
po::command_line_parser(ac, av).options(desc).positional(p).run(), vm);
|
||||
|
||||
// TODO: allow multiple input files
|
||||
assert(vm.count("onnx-model") < 2 && "At most one input file can be provided!");
|
||||
|
||||
if (vm.count("help")) {
|
||||
cout << desc << endl;
|
||||
|
@ -71,8 +105,21 @@ int main(int ac, char* av[]) {
|
|||
mlir::MLIRContext context;
|
||||
mlir::OwningModuleRef module;
|
||||
|
||||
// Decide if the input file is an ONNX model or a model specified
|
||||
// in MLIR. The extension of the file is the decider.
|
||||
string model_filename = vm["onnx-model"].as<string>();
|
||||
string extension =
|
||||
model_filename.substr(model_filename.find_last_of(".") + 1);
|
||||
bool onnx_model_provided = (extension == "onnx");
|
||||
bool mlir_model_provided = (extension == "mlir");
|
||||
|
||||
if (onnx_model_provided) {
|
||||
ImportFrontendModelFile(model_filename, context, module);
|
||||
} else if (mlir_model_provided) {
|
||||
LoadMLIR(model_filename, context, module);
|
||||
} else {
|
||||
assert(false && "No ONNX or MLIR models provided!");
|
||||
}
|
||||
|
||||
mlir::PassManager pm(&context);
|
||||
pm.addPass(mlir::createShapeInferencePass());
|
||||
|
|
Loading…
Reference in New Issue