torch-mlir/frontends/pytorch/csrc/init_python_bindings.cpp

//===- init_python_bindings.cpp ---------------------------------*- C++ -*-===//
//
// This file is licensed under a pytorch-style license
// See frontends/pytorch/LICENSE for license information.
//
//===----------------------------------------------------------------------===//

// This is the top-level entry point for the MLIR/NPCOMP <-> PyTorch bridge.
// It provides several mechanisms for extracting programs from PyTorch via:
//   a) A pseudo-device which captures the operations to an MLIR module
//      (implemented via the legacy type_dispatch mechanism for PyTorch 1.3).
//   b) Direct IR translation from PyTorch Graphs (not implemented).
//   c) Using the PyTorch JIT facility (not implemented).

#include "llvm/Support/Debug.h"
#include "llvm/Support/MemoryBuffer.h"
#include "llvm/Support/raw_ostream.h"

#include "mlir/Conversion/SCFToStandard/SCFToStandard.h"
#include "mlir/IR/MLIRContext.h"
#include "mlir/IR/Module.h"
#include "mlir/IR/Verifier.h"
#include "mlir/Parser.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Pass/PassManager.h"
#include "mlir/Transforms/Passes.h"

#include "npcomp/Dialect/ATen/ATenDialect.h"
#include "npcomp/Dialect/ATen/ATenOpReport.h"
#include "npcomp/Dialect/ATen/ATenPasses.h"
#include "npcomp/Dialect/ATen/LivenessReport.h"

#include "init_python_bindings.h"

#include <string>

namespace py = pybind11;
using namespace mlir;

// Declaration of LLVM's global debug-output switch, which the `set_debug`
// binding below assigns to directly.
// NOTE(review): llvm/Support/Debug.h may already declare this symbol in some
// build configurations — confirm whether this redeclaration is still needed.
namespace llvm {
extern bool DebugFlag;
}

namespace torch_mlir {
namespace {

// Parses the textual MLIR in `mlir` using `context` and verifies the result.
//
// Returns the parsed module on success. On a parse failure or a verification
// failure a diagnostic is written to llvm::errs() and a null OwningModuleRef
// is returned, so callers must test the result before dereferencing it.
//
// `context` is handed to the parser by pointer; the callers in this file keep
// it alive for as long as they use the returned module.
mlir::OwningModuleRef LoadModule(mlir::MLIRContext &context, std::string mlir) {
  // NOTE: getMemBuffer references the string's storage instead of copying it
  // (see the LLVM MemoryBuffer documentation), so `mlir` has to stay alive
  // until parsing is done. It does: it is a by-value parameter of this
  // function and outlives `sourceMgr`.
  std::unique_ptr<llvm::MemoryBuffer> membuf =
      llvm::MemoryBuffer::getMemBuffer(mlir);

  llvm::SourceMgr sourceMgr;
  sourceMgr.AddNewSourceBuffer(std::move(membuf), llvm::SMLoc());

  mlir::OwningModuleRef module = mlir::parseSourceFile(sourceMgr, &context);
  if (!module) {
    llvm::errs() << "Error can't parse mlir module\n";
    return nullptr;
  }
  if (failed(mlir::verify(*module))) {
    llvm::errs() << "Error verifying MLIR module\n";
    return nullptr;
  }
  return module;
}

// Registers the module-level helper functions on the Python module `m`:
//   _op_report(mlir)       -> str   runs ATenLayerNamePass + ATenOpReportPass
//   _liveness_report(mlir) -> str   runs ATenLayerNamePass, then emits the
//                                   LivenessReport as JSON
//   lower_to_std(mlir)     -> str   runs the ATen lowering pipeline and
//                                   returns the printed module
//   set_debug(b, type)     -> None  sets the LLVM debug type and debug flag
//
// Every function taking `mlir` parses it with LoadModule. When loading fails
// (LoadModule has already printed a diagnostic) the function returns the same
// sentinel it uses for a pass failure: "<error>" for the two report
// functions, "" for lower_to_std.
void InitModuleBindings(py::module &m) {
  m.def(
      "_op_report",
      [](std::string mlir) -> std::string {
        mlir::MLIRContext context;
        auto module = LoadModule(context, mlir);
        // LoadModule yields a null module on parse/verify failure;
        // dereferencing it would crash the Python interpreter.
        if (!module)
          return "<error>";

        mlir::PassManager pm(&context);

        // The report pass is constructed with `report`; presumably it fills
        // the string in while running (see ATenOpReport.h).
        std::string report;
        pm.addPass(mlir::NPCOMP::aten::createATenLayerNamePass());
        pm.addPass(mlir::NPCOMP::aten::createATenOpReportPass(report));

        if (failed(pm.run(*module))) {
          llvm::errs() << "ATenOpReportPass failed";
          return "<error>";
        }
        return report;
      },
      "run ATenOpReportPass");

  m.def(
      "_liveness_report",
      [](std::string mlir) -> std::string {
        mlir::MLIRContext context;
        auto module = LoadModule(context, mlir);
        // Guard against a failed load before touching the module.
        if (!module)
          return "<error>";

        mlir::PassManager pm(&context);

        pm.addPass(mlir::NPCOMP::aten::createATenLayerNamePass());
        if (failed(pm.run(*module))) {
          llvm::errs() << "ATen generate liveness report failed";
          return "<error>";
        }

        auto mOp = module.get();
        auto liveness = mlir::NPCOMP::aten::LivenessReport(mOp);
        std::string report = liveness.emitJSONReport();
        return report;
      },
      "generate liveness report");

  // TODO: Could this be implemented with MLIR python bindings?
  m.def(
      "lower_to_std",
      [](std::string mlir) -> std::string {
        mlir::MLIRContext context;
        auto module = LoadModule(context, mlir);
        // Guard against a failed load; "" is this function's failure value.
        if (!module)
          return "";

        PassManager pm0(&context);
        pm0.addPass(mlir::NPCOMP::aten::createATenLoweringPass());
        pm0.addPass(mlir::NPCOMP::aten::createReturnEliminationPass());
        pm0.addPass(mlir::createCSEPass());

        if (failed(pm0.run(*module))) {
          llvm::errs() << "aten to loops conversion failed ";
          return "";
        }

        // dump MLIR to string and return
        std::string s;
        llvm::raw_string_ostream ss(s);
        ss << "# Lowered to Std\n";
        module->print(ss);
        return ss.str();
      },
      "lower aten to std dialect");

  m.def(
      "set_debug",
      [](bool b, std::string type) -> void {
        llvm::setCurrentDebugType(type.c_str());
        llvm::DebugFlag = b;
      },
      "enable/disable debug messages");
}

} // namespace

// Populates the Python module `m`: the module-level helpers are always
// registered, and the type-dispatch bindings are added only when the build
// defines NPCOMP_ENABLE_TORCH_TYPE_DISPATCH.
void InitBindings(py::module &m) {
  InitModuleBindings(m);
#ifdef NPCOMP_ENABLE_TORCH_TYPE_DISPATCH
  InitTypeDispatchBindings(m);
#endif
}

} // namespace torch_mlir

// Defines the `_torch_mlir` extension module; its body just forwards to
// torch_mlir::InitBindings.
PYBIND11_MODULE(_torch_mlir, m) {
  torch_mlir::InitBindings(m);
}
Add pytorch interface to ATen Dialect (#30) This patch adds a pytorch interface to npcomp. This interface is modeled after pytorch_xla and exposes the MLIR-based flow as a virtual device (similar to a gpu device or the xla backend). Usage is intended to be something like: dev = torch_mlir.mlir_device() t0 = torch.randn((4,4), device=dev) t1 = torch.randn((4,4), device=dev) t2 = t0 + t1 t2_mlir = torch_mlir.get_mlir( t2 ) t2_cpu = t2.to('cpu') In this case t2_cpu would contain the result of the computation, and t2_mlir contains the mlir description of the computation. Note that this also properly returns backward paths synthesized by pytorch. There are several parts of this: 1) A tensor type (implemented by tensor.* and tensor_impl.) 2) The device modeling (aten_mlir_bridge., aten_mlir_device., aten_mlir_type) 3) a temporary IR (implemented by ir.cpp) There is also a reference lowering directly from the ATen dialect to C function calls consisting of two parts: 1) The driver that uses the IR to generate MLIR, run Passes and compile the result using mlir::ExecutionEngine (implemented by jit.cpp and mlir_gen.cpp) 2) A runtime library implemented by lib/aten_ops.cpp. Most of the operations are implemented by callbacks into the torch C++ libraries. Some aspects of this are known to be less than optimal, in particular: 1) There's some function definitions that don't live in the file corresponding to their declaration. 2) More aspects of this (e.g. the IR) seem like they should be automatically generated. 3) It's unclear to me how much of the 'IR' is actually necessary, or whether MLIR could be created on the fly. Note that this code is licensed in a way similar to pytorch, with the intention that eventually (when npcomp reaches some maturity) it should be pushed there. (see frontends/pytorch/LICENSE) The code is also structured much closer to the pytorch coding style than the LLVM coding style. 
2020-08-22 02:22:47 +08:00			`//===- init_python_bindings.cpp ---------------------------------*- C++ -*-===//`
			`//`
			`// This file is licensed under a pytorch-style license`
			`// See frontends/pytorch/LICENSE for license information.`
			`//`
			`//===----------------------------------------------------------------------===//`

Make code that depends on the legacy "type dispatch" mechanism optional. (#32) * Make code that depends on the legacy "type dispatch" mechanism optional. * This code is fairly tied to a specific ~1.3 version and uses a legacy dispatch mechanism. * Moving it and making it optional allows the project to build with PyTorch 1.6 and makes it possible for us to start building out a more modern interface mechanism in parallel. * Some of the moved code will be brought back into the more modern path, but isolating it now lets this be done incrementally. * Tests are left failing since the entire frontend is optional and the next step involves reworking the interface mechanism to get them to passing in both regimes. * Fix a few bogons to get things building * Add Dockerfile with pytorch Also, I configure with: -DCMAKE_PREFIX_PATH="/opt/pytorch/pytorch" (which is where pytorch is installed in this container) * Make a dep conditional. Co-authored-by: stephenneuendorffer <stephen.neuendorffer@xilinx.com> 2020-08-27 03:55:16 +08:00			`// This is the top-level entry point for the MLIR/NPCOMP <-> PyTorch bridge.`
			`// It provides several mechanisms for extracting programs from PyTorch via:`
			`// a) A pseudo-device which captures the operations to an MLIR module`
			`// (implemented via the legacy type_dispatch mechanism for PyTorch 1.3).`
			`// b) Direct IR translation from PyTorch Graphs (not implemented).`
			`// c) Using the PyTorch JIT facility (not implemented).`
Add pytorch interface to ATen Dialect (#30) This patch adds a pytorch interface to npcomp. This interface is modeled after pytorch_xla and exposes the MLIR-based flow as a virtual device (similar to a gpu device or the xla backend). Usage is intended to be something like: dev = torch_mlir.mlir_device() t0 = torch.randn((4,4), device=dev) t1 = torch.randn((4,4), device=dev) t2 = t0 + t1 t2_mlir = torch_mlir.get_mlir( t2 ) t2_cpu = t2.to('cpu') In this case t2_cpu would contain the result of the computation, and t2_mlir contains the mlir description of the computation. Note that this also properly returns backward paths synthesized by pytorch. There are several parts of this: 1) A tensor type (implemented by tensor.* and tensor_impl.) 2) The device modeling (aten_mlir_bridge., aten_mlir_device., aten_mlir_type) 3) a temporary IR (implemented by ir.cpp) There is also a reference lowering directly from the ATen dialect to C function calls consisting of two parts: 1) The driver that uses the IR to generate MLIR, run Passes and compile the result using mlir::ExecutionEngine (implemented by jit.cpp and mlir_gen.cpp) 2) A runtime library implemented by lib/aten_ops.cpp. Most of the operations are implemented by callbacks into the torch C++ libraries. Some aspects of this are known to be less than optimal, in particular: 1) There's some function definitions that don't live in the file corresponding to their declaration. 2) More aspects of this (e.g. the IR) seem like they should be automatically generated. 3) It's unclear to me how much of the 'IR' is actually necessary, or whether MLIR could be created on the fly. Note that this code is licensed in a way similar to pytorch, with the intention that eventually (when npcomp reaches some maturity) it should be pushed there. (see frontends/pytorch/LICENSE) The code is also structured much closer to the pytorch coding style than the LLVM coding style. 2020-08-22 02:22:47 +08:00
			`#include "llvm/Support/Debug.h"`
			`#include "llvm/Support/MemoryBuffer.h"`
			`#include "llvm/Support/raw_ostream.h"`

			`#include "mlir/Conversion/SCFToStandard/SCFToStandard.h"`
			`#include "mlir/IR/MLIRContext.h"`
			`#include "mlir/IR/Module.h"`
			`#include "mlir/IR/Verifier.h"`
			`#include "mlir/Parser.h"`
			`#include "mlir/Pass/Pass.h"`
			`#include "mlir/Pass/PassManager.h"`
			`#include "mlir/Transforms/Passes.h"`

			`#include "npcomp/Dialect/ATen/ATenDialect.h"`
			`#include "npcomp/Dialect/ATen/ATenOpReport.h"`
			`#include "npcomp/Dialect/ATen/ATenPasses.h"`
			`#include "npcomp/Dialect/ATen/LivenessReport.h"`

			`#include "init_python_bindings.h"`

			`#include <string>`

Make code that depends on the legacy "type dispatch" mechanism optional. (#32) * Make code that depends on the legacy "type dispatch" mechanism optional. * This code is fairly tied to a specific ~1.3 version and uses a legacy dispatch mechanism. * Moving it and making it optional allows the project to build with PyTorch 1.6 and makes it possible for us to start building out a more modern interface mechanism in parallel. * Some of the moved code will be brought back into the more modern path, but isolating it now lets this be done incrementally. * Tests are left failing since the entire frontend is optional and the next step involves reworking the interface mechanism to get them to passing in both regimes. * Fix a few bogons to get things building * Add Dockerfile with pytorch Also, I configure with: -DCMAKE_PREFIX_PATH="/opt/pytorch/pytorch" (which is where pytorch is installed in this container) * Make a dep conditional. Co-authored-by: stephenneuendorffer <stephen.neuendorffer@xilinx.com> 2020-08-27 03:55:16 +08:00			`namespace py = pybind11;`
Add pytorch interface to ATen Dialect (#30) This patch adds a pytorch interface to npcomp. This interface is modeled after pytorch_xla and exposes the MLIR-based flow as a virtual device (similar to a gpu device or the xla backend). Usage is intended to be something like: dev = torch_mlir.mlir_device() t0 = torch.randn((4,4), device=dev) t1 = torch.randn((4,4), device=dev) t2 = t0 + t1 t2_mlir = torch_mlir.get_mlir( t2 ) t2_cpu = t2.to('cpu') In this case t2_cpu would contain the result of the computation, and t2_mlir contains the mlir description of the computation. Note that this also properly returns backward paths synthesized by pytorch. There are several parts of this: 1) A tensor type (implemented by tensor.* and tensor_impl.) 2) The device modeling (aten_mlir_bridge., aten_mlir_device., aten_mlir_type) 3) a temporary IR (implemented by ir.cpp) There is also a reference lowering directly from the ATen dialect to C function calls consisting of two parts: 1) The driver that uses the IR to generate MLIR, run Passes and compile the result using mlir::ExecutionEngine (implemented by jit.cpp and mlir_gen.cpp) 2) A runtime library implemented by lib/aten_ops.cpp. Most of the operations are implemented by callbacks into the torch C++ libraries. Some aspects of this are known to be less than optimal, in particular: 1) There's some function definitions that don't live in the file corresponding to their declaration. 2) More aspects of this (e.g. the IR) seem like they should be automatically generated. 3) It's unclear to me how much of the 'IR' is actually necessary, or whether MLIR could be created on the fly. Note that this code is licensed in a way similar to pytorch, with the intention that eventually (when npcomp reaches some maturity) it should be pushed there. (see frontends/pytorch/LICENSE) The code is also structured much closer to the pytorch coding style than the LLVM coding style. 2020-08-22 02:22:47 +08:00			`using namespace mlir;`

			`namespace llvm {`
			`extern bool DebugFlag;`
			`}`

			`namespace torch_mlir {`
			`namespace {`

			`mlir::OwningModuleRef LoadModule(mlir::MLIRContext &context, std::string mlir) {`

			`mlir::OwningModuleRef module;`

			`std::unique_ptr<llvm::MemoryBuffer> membuf =`
			`llvm::MemoryBuffer::getMemBuffer(mlir);`

			`llvm::SourceMgr sourceMgr;`
			`sourceMgr.AddNewSourceBuffer(std::move(membuf), llvm::SMLoc());`
			`module = mlir::parseSourceFile(sourceMgr, &context);`

			`if (!module) {`
			`llvm::errs() << "Error can't parse mlir module\n";`
			`return nullptr;`
			`}`
			`if (failed(mlir::verify(*module))) {`
			`llvm::errs() << "Error verifying MLIR module\n";`
			`return nullptr;`
			`}`
			`if (!module)`
			`return nullptr;`
			`return module;`
			`}`

Make code that depends on the legacy "type dispatch" mechanism optional. (#32) * Make code that depends on the legacy "type dispatch" mechanism optional. * This code is fairly tied to a specific ~1.3 version and uses a legacy dispatch mechanism. * Moving it and making it optional allows the project to build with PyTorch 1.6 and makes it possible for us to start building out a more modern interface mechanism in parallel. * Some of the moved code will be brought back into the more modern path, but isolating it now lets this be done incrementally. * Tests are left failing since the entire frontend is optional and the next step involves reworking the interface mechanism to get them to passing in both regimes. * Fix a few bogons to get things building * Add Dockerfile with pytorch Also, I configure with: -DCMAKE_PREFIX_PATH="/opt/pytorch/pytorch" (which is where pytorch is installed in this container) * Make a dep conditional. Co-authored-by: stephenneuendorffer <stephen.neuendorffer@xilinx.com> 2020-08-27 03:55:16 +08:00			`void InitModuleBindings(py::module &m) {`
Add pytorch interface to ATen Dialect (#30) This patch adds a pytorch interface to npcomp. This interface is modeled after pytorch_xla and exposes the MLIR-based flow as a virtual device (similar to a gpu device or the xla backend). Usage is intended to be something like: dev = torch_mlir.mlir_device() t0 = torch.randn((4,4), device=dev) t1 = torch.randn((4,4), device=dev) t2 = t0 + t1 t2_mlir = torch_mlir.get_mlir( t2 ) t2_cpu = t2.to('cpu') In this case t2_cpu would contain the result of the computation, and t2_mlir contains the mlir description of the computation. Note that this also properly returns backward paths synthesized by pytorch. There are several parts of this: 1) A tensor type (implemented by tensor.* and tensor_impl.) 2) The device modeling (aten_mlir_bridge., aten_mlir_device., aten_mlir_type) 3) a temporary IR (implemented by ir.cpp) There is also a reference lowering directly from the ATen dialect to C function calls consisting of two parts: 1) The driver that uses the IR to generate MLIR, run Passes and compile the result using mlir::ExecutionEngine (implemented by jit.cpp and mlir_gen.cpp) 2) A runtime library implemented by lib/aten_ops.cpp. Most of the operations are implemented by callbacks into the torch C++ libraries. Some aspects of this are known to be less than optimal, in particular: 1) There's some function definitions that don't live in the file corresponding to their declaration. 2) More aspects of this (e.g. the IR) seem like they should be automatically generated. 3) It's unclear to me how much of the 'IR' is actually necessary, or whether MLIR could be created on the fly. Note that this code is licensed in a way similar to pytorch, with the intention that eventually (when npcomp reaches some maturity) it should be pushed there. (see frontends/pytorch/LICENSE) The code is also structured much closer to the pytorch coding style than the LLVM coding style. 2020-08-22 02:22:47 +08:00			`m.def(`
			`"_op_report",`
			`[](std::string mlir) -> std::string {`
			`mlir::MLIRContext context;`
			`auto module = LoadModule(context, mlir);`
			`mlir::PassManager pm(module->getContext());`

			`// our pass`
			`std::string report;`
			`pm.addPass(mlir::NPCOMP::aten::createATenLayerNamePass());`
			`pm.addPass(mlir::NPCOMP::aten::createATenOpReportPass(report));`

			`if (failed(pm.run(*module))) {`
			`llvm::errs() << "ATenOpReportPass failed";`
			`return "<error>";`
			`}`
			`return report;`
			`},`
			`"run ATenOpReportPass");`

			`m.def(`
			`"_liveness_report",`
			`[](std::string mlir) -> std::string {`
			`mlir::MLIRContext context;`
			`auto module = LoadModule(context, mlir);`

			`mlir::PassManager pm(module->getContext());`

			`pm.addPass(mlir::NPCOMP::aten::createATenLayerNamePass());`
			`if (failed(pm.run(*module))) {`
			`llvm::errs() << "ATen generate liveness report failed";`
			`return "<error>";`
			`}`

			`auto mOp = module.get();`
			`auto liveness = mlir::NPCOMP::aten::LivenessReport(mOp);`
			`std::string report = liveness.emitJSONReport();`
			`return report;`
			`},`
			`"generate liveness report");`

			`// TODO: Could this be implemented with MLIR python bindings?`
			`m.def(`
			`"lower_to_std",`
			`[](std::string mlir) -> std::string {`
			`mlir::MLIRContext context;`
			`auto module = LoadModule(context, mlir);`

			`PassManager pm0(module->getContext());`
			`pm0.addPass(mlir::NPCOMP::aten::createATenLoweringPass());`
			`pm0.addPass(mlir::NPCOMP::aten::createReturnEliminationPass());`
			`pm0.addPass(mlir::createCSEPass());`

			`if (failed(pm0.run(*module))) {`
			`llvm::errs() << "aten to loops conversion failed ";`
			`return "";`
			`}`

			`// dump MLIR to string and return`
			`std::string s;`
			`llvm::raw_string_ostream ss(s);`
			`ss << "# Lowered to Std\n";`
			`module->print(ss);`
			`return ss.str();`
			`},`
			`"lower aten to std dialect");`

			`m.def(`
			`"set_debug",`
			`[](bool b, std::string type) -> void {`
			`llvm::setCurrentDebugType(type.c_str());`
			`llvm::DebugFlag = b;`
			`},`
			`"enable/disable debug messages");`
			`}`

			`} // namespace`

Make code that depends on the legacy "type dispatch" mechanism optional. (#32) * Make code that depends on the legacy "type dispatch" mechanism optional. * This code is fairly tied to a specific ~1.3 version and uses a legacy dispatch mechanism. * Moving it and making it optional allows the project to build with PyTorch 1.6 and makes it possible for us to start building out a more modern interface mechanism in parallel. * Some of the moved code will be brought back into the more modern path, but isolating it now lets this be done incrementally. * Tests are left failing since the entire frontend is optional and the next step involves reworking the interface mechanism to get them to passing in both regimes. * Fix a few bogons to get things building * Add Dockerfile with pytorch Also, I configure with: -DCMAKE_PREFIX_PATH="/opt/pytorch/pytorch" (which is where pytorch is installed in this container) * Make a dep conditional. Co-authored-by: stephenneuendorffer <stephen.neuendorffer@xilinx.com> 2020-08-27 03:55:16 +08:00			`void InitBindings(py::module &m) {`
			`InitModuleBindings(m);`

			`#if defined(NPCOMP_ENABLE_TORCH_TYPE_DISPATCH)`
			`InitTypeDispatchBindings(m);`
			`#endif`
			`}`
Add pytorch interface to ATen Dialect (#30) This patch adds a pytorch interface to npcomp. This interface is modeled after pytorch_xla and exposes the MLIR-based flow as a virtual device (similar to a gpu device or the xla backend). Usage is intended to be something like: dev = torch_mlir.mlir_device() t0 = torch.randn((4,4), device=dev) t1 = torch.randn((4,4), device=dev) t2 = t0 + t1 t2_mlir = torch_mlir.get_mlir( t2 ) t2_cpu = t2.to('cpu') In this case t2_cpu would contain the result of the computation, and t2_mlir contains the mlir description of the computation. Note that this also properly returns backward paths synthesized by pytorch. There are several parts of this: 1) A tensor type (implemented by tensor.* and tensor_impl.) 2) The device modeling (aten_mlir_bridge., aten_mlir_device., aten_mlir_type) 3) a temporary IR (implemented by ir.cpp) There is also a reference lowering directly from the ATen dialect to C function calls consisting of two parts: 1) The driver that uses the IR to generate MLIR, run Passes and compile the result using mlir::ExecutionEngine (implemented by jit.cpp and mlir_gen.cpp) 2) A runtime library implemented by lib/aten_ops.cpp. Most of the operations are implemented by callbacks into the torch C++ libraries. Some aspects of this are known to be less than optimal, in particular: 1) There's some function definitions that don't live in the file corresponding to their declaration. 2) More aspects of this (e.g. the IR) seem like they should be automatically generated. 3) It's unclear to me how much of the 'IR' is actually necessary, or whether MLIR could be created on the fly. Note that this code is licensed in a way similar to pytorch, with the intention that eventually (when npcomp reaches some maturity) it should be pushed there. (see frontends/pytorch/LICENSE) The code is also structured much closer to the pytorch coding style than the LLVM coding style. 2020-08-22 02:22:47 +08:00
			`} // namespace torch_mlir`

			`PYBIND11_MODULE(_torch_mlir, m) { torch_mlir::InitBindings(m); }`