// torch-mlir/lib/Conversion/TCFToTCP/TCFToTCP.cpp

//===----------------------------------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//

#include "npcomp/Conversion/TCFToTCP/TCFToTCP.h"

#include "../PassDetail.h"
#include "mlir/Dialect/Shape/IR/Shape.h"
#include "mlir/Dialect/Traits.h"
#include "mlir/Transforms/DialectConversion.h"
#include "npcomp/Dialect/TCF/IR/TCFOps.h"
#include "npcomp/Dialect/TCP/IR/TCPOps.h"

using namespace mlir;
using namespace mlir::NPCOMP;

namespace {
class ConvertAdd : public OpRewritePattern<tcf::AddOp> {
public:
  using OpRewritePattern::OpRewritePattern;
  LogicalResult matchAndRewrite(tcf::AddOp op,
                                PatternRewriter &rewriter) const override {
    auto lhsType = op.lhs().getType().dyn_cast<RankedTensorType>();
    auto rhsType = op.rhs().getType().dyn_cast<RankedTensorType>();
    if (!lhsType || !rhsType) {
      return rewriter.notifyMatchFailure(op, "requires ranked tensors");
    }
    Value lhsShape = rewriter.create<shape::ShapeOfOp>(op.getLoc(), op.lhs());
    Value rhsShape = rewriter.create<shape::ShapeOfOp>(op.getLoc(), op.rhs());
    Value broadcastedShape = rewriter.create<shape::BroadcastOp>(
        op.getLoc(), lhsShape, rhsShape, /*error=*/nullptr);
    Value witness =
        rewriter.create<tcp::AbortIfErrorOp>(op.getLoc(), broadcastedShape);
    tcp::IslandOp island =
        rewriter.create<tcp::IslandOp>(op.getLoc(), op.getType(), witness);
    Region &body = island.body();
    Block *bodyBlock = new Block;
    body.push_back(bodyBlock);
    OpBuilder::InsertionGuard guard(rewriter);
    rewriter.setInsertionPoint(bodyBlock, bodyBlock->begin());
    // TODO: It's annoying to do the dynamic broadcast above then
    // do the static transfer function here. Would be nice if they could
    // somehow be unified.
    SmallVector<int64_t, 6> broadcastedStaticShape;
    OpTrait::util::getBroadcastedShape(lhsType.getShape(), rhsType.getShape(),
                                       broadcastedStaticShape);
    auto resultType =
        RankedTensorType::get(broadcastedStaticShape, lhsType.getElementType());
    Value lhsBroadcasted = rewriter.create<tcp::BroadcastToOp>(
        op.getLoc(), resultType, op.lhs(), broadcastedShape);
    Value rhsBroadcasted = rewriter.create<tcp::BroadcastToOp>(
        op.getLoc(), resultType, op.rhs(), broadcastedShape);
    Value add = rewriter.create<tcp::AddOp>(op.getLoc(), op.getType(),
                                            lhsBroadcasted, rhsBroadcasted);
    rewriter.create<tcp::YieldOp>(op.getLoc(), add);

    rewriter.replaceOp(op, island.getResults());
    return success();
  }
};
}

namespace {
class ConvertTCFToTCP : public ConvertTCFToTCPBase<ConvertTCFToTCP> {
public:
  void runOnOperation() {
    ModuleOp module = getOperation();
    MLIRContext *context = &getContext();

    OwningRewritePatternList patterns;
    patterns.insert<ConvertAdd>(context);
    (void)applyPatternsAndFoldGreedily(module, patterns);
  }
};
} // namespace

std::unique_ptr<OperationPass<ModuleOp>>
mlir::NPCOMP::createConvertTCFToTCPPass() {
  return std::make_unique<ConvertTCFToTCP>();
}
Initial TCF/TCP E2E seed. Very much WIP. This is enough to get tcf.add down to approximately the "linalg.generic on buffers" level of abstraction. (but there are nuances) 2020-05-07 09:41:54 +08:00			`//===----------------------------------------------------------------------===//`
			`//`
			`// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.`
			`// See https://llvm.org/LICENSE.txt for license information.`
			`// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception`
			`//`
			`//===----------------------------------------------------------------------===//`

			`#include "npcomp/Conversion/TCFToTCP/TCFToTCP.h"`

			`#include "../PassDetail.h"`
			`#include "mlir/Dialect/Shape/IR/Shape.h"`
			`#include "mlir/Dialect/Traits.h"`
			`#include "mlir/Transforms/DialectConversion.h"`
			`#include "npcomp/Dialect/TCF/IR/TCFOps.h"`
			`#include "npcomp/Dialect/TCP/IR/TCPOps.h"`

			`using namespace mlir;`
			`using namespace mlir::NPCOMP;`

			`namespace {`
			`class ConvertAdd : public OpRewritePattern<tcf::AddOp> {`
			`public:`
			`using OpRewritePattern::OpRewritePattern;`
			`LogicalResult matchAndRewrite(tcf::AddOp op,`
			`PatternRewriter &rewriter) const override {`
			`auto lhsType = op.lhs().getType().dyn_cast<RankedTensorType>();`
			`auto rhsType = op.rhs().getType().dyn_cast<RankedTensorType>();`
			`if (!lhsType \|\| !rhsType) {`
			`return rewriter.notifyMatchFailure(op, "requires ranked tensors");`
			`}`
			`Value lhsShape = rewriter.create<shape::ShapeOfOp>(op.getLoc(), op.lhs());`
			`Value rhsShape = rewriter.create<shape::ShapeOfOp>(op.getLoc(), op.rhs());`
			`Value broadcastedShape = rewriter.create<shape::BroadcastOp>(`
			`op.getLoc(), lhsShape, rhsShape, /error=/nullptr);`
			`Value witness =`
			`rewriter.create<tcp::AbortIfErrorOp>(op.getLoc(), broadcastedShape);`
			`tcp::IslandOp island =`
			`rewriter.create<tcp::IslandOp>(op.getLoc(), op.getType(), witness);`
			`Region &body = island.body();`
			`Block *bodyBlock = new Block;`
			`body.push_back(bodyBlock);`
			`OpBuilder::InsertionGuard guard(rewriter);`
			`rewriter.setInsertionPoint(bodyBlock, bodyBlock->begin());`
			`// TODO: It's annoying to do the dynamic broadcast above then`
			`// do the static transfer function here. Would be nice if they could`
			`// somehow be unified.`
			`SmallVector<int64_t, 6> broadcastedStaticShape;`
			`OpTrait::util::getBroadcastedShape(lhsType.getShape(), rhsType.getShape(),`
			`broadcastedStaticShape);`
			`auto resultType =`
			`RankedTensorType::get(broadcastedStaticShape, lhsType.getElementType());`
			`Value lhsBroadcasted = rewriter.create<tcp::BroadcastToOp>(`
			`op.getLoc(), resultType, op.lhs(), broadcastedShape);`
			`Value rhsBroadcasted = rewriter.create<tcp::BroadcastToOp>(`
			`op.getLoc(), resultType, op.rhs(), broadcastedShape);`
			`Value add = rewriter.create<tcp::AddOp>(op.getLoc(), op.getType(),`
			`lhsBroadcasted, rhsBroadcasted);`
			`rewriter.create<tcp::YieldOp>(op.getLoc(), add);`

			`rewriter.replaceOp(op, island.getResults());`
			`return success();`
			`}`
			`};`
			`}`

			`namespace {`
			`class ConvertTCFToTCP : public ConvertTCFToTCPBase<ConvertTCFToTCP> {`
			`public:`
			`void runOnOperation() {`
			`ModuleOp module = getOperation();`
			`MLIRContext *context = &getContext();`

			`OwningRewritePatternList patterns;`
			`patterns.insert<ConvertAdd>(context);`
			`(void)applyPatternsAndFoldGreedily(module, patterns);`
			`}`
			`};`
			`} // namespace`

			`std::unique_ptr<OperationPass<ModuleOp>>`
			`mlir::NPCOMP::createConvertTCFToTCPPass() {`
			`return std::make_unique<ConvertTCFToTCP>();`
			`}`