//===------------------------------------------------------------*- C++ -*-===//
//
// This file is licensed under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
// Also available under a BSD-style license. See LICENSE.
//
//===----------------------------------------------------------------------===//

#include "mlir/IR/DialectResourceBlobManager.h"
#include "torch-mlir/Conversion/TorchOnnxToTorch/Patterns.h"
#include "torch-mlir/Conversion/TorchOnnxToTorch/Utils.h"
#include "torch-mlir/Dialect/Torch/IR/TorchOps.h"
#include "torch-mlir/Dialect/Torch/Utils/Utils.h"
#include "llvm/Support/FormatVariadic.h"
#include <numeric>

using namespace mlir;
using namespace mlir::torch;
using namespace mlir::torch::onnx_c;

namespace {
LogicalResult windowFunctionImpl(OpBinder binder,
                                 ConversionPatternRewriter &rewriter,
                                 Value size, Value a0, Value a1, Value a2,
                                 Torch::ValueTensorType resultType,
                                 int64_t output_datatype, int64_t periodic) {

  Location loc = binder.getLoc();
  ImplicitLocOpBuilder b(loc, rewriter);

  double isPeriodicFp = static_cast<double>(periodic);

  Value zero = b.create<Torch::ConstantFloatOp>(rewriter.getF64FloatAttr(0.0));
  Value one = b.create<Torch::ConstantFloatOp>(rewriter.getF64FloatAttr(1.0));
  Value two = b.create<Torch::ConstantFloatOp>(rewriter.getF64FloatAttr(2.0));

  constexpr double pi = llvm::numbers::pi;
  Value tau = b.create<Torch::ConstantFloatOp>(
      rewriter.getFloatAttr(rewriter.getF64Type(), 2.0 * pi));

  Value noneVal = b.create<Torch::ConstantNoneOp>();
  Value cstFalse = b.create<Torch::ConstantBoolOp>(false);
  Value float32Type = b.create<Torch::ConstantIntOp>(
      rewriter.getI64IntegerAttr(/*float32Type*/ 6));

  // Create an f32 ValueTensorType with the same size as size, the operand.
  auto shapeOfOperand =
      dyn_cast<Torch::ValueTensorType>(size.getType()).getOptionalSizes();
  auto f32ResultType = rewriter.getType<Torch::ValueTensorType>(
      shapeOfOperand, rewriter.getF32Type());
  Value periodicSizeFloat = b.create<Torch::AtenToDtypeOp>(
      f32ResultType, size, float32Type, cstFalse, cstFalse, noneVal);
  Value symmetricSizeFloat = b.create<Torch::AtenSubScalarOp>(
      periodicSizeFloat.getType(), periodicSizeFloat, one, one);

  Value isPeriodic =
      b.create<Torch::ConstantFloatOp>(rewriter.getF64FloatAttr(isPeriodicFp));
  Value isSymmetricFloat = b.create<Torch::ConstantFloatOp>(
      rewriter.getF64FloatAttr(1.0 - isPeriodicFp));

  Value periodicComponent = b.create<Torch::AtenMulScalarOp>(
      periodicSizeFloat.getType(), periodicSizeFloat, isPeriodic);
  Value symmetricComponent = b.create<Torch::AtenMulScalarOp>(
      symmetricSizeFloat.getType(), symmetricSizeFloat, isSymmetricFloat);
  Value sizeFloat = b.create<Torch::AtenAddTensorOp>(
      symmetricComponent.getType(), symmetricComponent, periodicComponent, one);

  // Here, size can be used in the place of periodicSizeFloat, as the
  // latter is just a float representation of the former.
  Value scalarLimit = getItemOp<Torch::IntType>(binder, rewriter, size);

  Value rangeArr = b.create<Torch::AtenArangeStartStepOp>(
      resultType, zero, scalarLimit, one, noneVal, noneVal, noneVal, noneVal);

  Value rangeTimesTau =
      b.create<Torch::AtenMulScalarOp>(resultType, rangeArr, tau);
  Value rangeAngular =
      b.create<Torch::AtenDivTensorOp>(resultType, rangeTimesTau, sizeFloat);
  Value twoRangeAngular =
      b.create<Torch::AtenMulScalarOp>(resultType, rangeAngular, two);

  Value cosRangeAngular = b.create<Torch::AtenCosOp>(resultType, rangeAngular);
  Value cosTwoRangeAngular =
      b.create<Torch::AtenCosOp>(resultType, twoRangeAngular);

  Value a1Component =
      b.create<Torch::AtenMulScalarOp>(resultType, cosRangeAngular, a1);
  Value a2Component =
      b.create<Torch::AtenMulScalarOp>(resultType, cosTwoRangeAngular, a2);

  // AtenSubScalarOp actually requires a tensor operand as the LHS, that
  // is, operand #1. Therefore, to avoid errors, the onnx implementation
  // has been modified. a1 has been changed to negative half, and the
  // AtenSubScalarOp has been replaced with AtenAddScalarOp, as the add
  // operation is commutative.
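  // With the sign convention above, the value assembled below is the
  // generalized cosine window
  //   w[n] = a0 + a1 * cos(tau * n / N) + a2 * cos(2 * tau * n / N),
  // e.g. a Hann window corresponds to a0 = 0.5, a1 = -0.5, a2 = 0.0 and a
  // Blackman window to a0 = 0.42, a1 = -0.5, a2 = 0.08.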
  Value subA1Component =
      b.create<Torch::AtenAddScalarOp>(resultType, a1Component, a0, one);
  Value result = b.create<Torch::AtenAddTensorOp>(resultType, subA1Component,
                                                  a2Component, one);

  std::optional<int64_t> dtypeIntTorch =
      onnxDtypeIntToTorchDtypeInt(output_datatype);
  if (!dtypeIntTorch.has_value()) {
    return rewriter.notifyMatchFailure(
        binder.op, "unimplemented support for the given dtype conversion");
  }
  Value outputDtype = b.create<Torch::ConstantIntOp>(
      rewriter.getType<Torch::IntType>(),
      rewriter.getIntegerAttr(rewriter.getIntegerType(64),
                              dtypeIntTorch.value()));

  rewriter.replaceOpWithNewOp<Torch::AtenToDtypeOp>(
      binder.op, resultType, result, outputDtype,
      /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
      /*memory_format=*/noneVal);

  return success();
}
} // namespace

// Simple rewrites for the default domain.
// See: https://onnx.ai/onnx/operators/
// For operators that are effectively version invariant, we register with
// sinceVersion==1. We interpret this to include the following spec
// diffs that are irrelevant to this level of lowering:
//   * Supported element types.
//   * Limited broadcasting to full broadcasting support.
//
// There are a lot of spec revisions that basically generalized elementwise
// to be more normal and a direct translation vs a special case. This
// results in a lot of ONNX test cases that all reduce to the exact same
// thing here, so we simplify.
void mlir::torch::onnx_c::populateDefaultDomainAtoF(
    OnnxCustomOpConversionPattern &patterns) {
  patterns.onOp("Abs", 1,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAbsOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  // Add became forward compatible with Torch in version 7.
  patterns.onOp("Add", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  Value const1 = rewriter.create<Torch::ConstantIntOp>(
                      binder.getLoc(), rewriter.getType<Torch::IntType>(),
                      rewriter.getIntegerAttr(rewriter.getIntegerType(64), 1));
                  rewriter.replaceOpWithNewOp<Torch::AtenAddTensorOp>(
                      binder.op, resultType, lhs, rhs, const1);
                  return success();
                });
  // TODO: AffineGrid
  patterns.onOp("And", 1,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenLogicalAndOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp(
      "ArgMax", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand;
        bool keepDims;
        int64_t axis;
        bool selectLastIndex;
        if (binder.tensorOperand(operand) ||
            binder.tensorResultType(resultType) ||
            binder.s64BoolAttr(keepDims, "keepdims", true) ||
            binder.s64IntegerAttr(axis, "axis", 0) ||
            binder.s64BoolAttr(selectLastIndex, "select_last_index", false))
          return failure();

        // ONNX allows negative axis.
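        // e.g. axis == -1 on a rank-4 operand normalizes to axis == 3.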
        auto operandSizes =
            cast<Torch::ValueTensorType>(operand.getType()).getSizes();
        if (axis < 0)
          axis += operandSizes.size();

        Value constAxis = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(),
            rewriter.getIntegerAttr(rewriter.getIntegerType(64), axis));
        Value constKeepDims = rewriter.create<Torch::ConstantBoolOp>(
            binder.getLoc(), rewriter.getType<Torch::BoolType>(),
            rewriter.getBoolAttr(keepDims));

        if (selectLastIndex) {
          Value dims = createConstantIntList(binder, rewriter, {axis});
          auto operandTy = dyn_cast<Torch::ValueTensorType>(operand.getType());
          operand = rewriter.create<Torch::AtenFlipOp>(
              binder.getLoc(), operandTy, operand, dims);
          Value argmax = rewriter.create<Torch::AtenArgmaxOp>(
              binder.getLoc(), resultType, operand, constAxis, constKeepDims);
          Value offset = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(),
              rewriter.getI64IntegerAttr(operandSizes[axis] - 1));
          Value alpha = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(1));
          Value sub = rewriter.create<Torch::AtenSubScalarOp>(
              binder.getLoc(), resultType, argmax, offset, alpha);
          rewriter.replaceOpWithNewOp<Torch::AtenAbsOp>(binder.op, resultType,
                                                        sub);
          return success();
        }

        rewriter.replaceOpWithNewOp<Torch::AtenArgmaxOp>(
            binder.op, resultType, operand, constAxis, constKeepDims);
        return success();
      });
  patterns.onOp(
      "ArgMin", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand;
        bool keepDims;
        int64_t axis;
        bool selectLastIndex;
        if (binder.tensorOperand(operand) ||
            binder.tensorResultType(resultType) ||
            binder.s64BoolAttr(keepDims, "keepdims", true) ||
            binder.s64IntegerAttr(axis, "axis", 0) ||
            binder.s64BoolAttr(selectLastIndex, "select_last_index", false))
          return failure();

        // ONNX allows negative axis.
        auto operandSizes =
            cast<Torch::ValueTensorType>(operand.getType()).getSizes();
        if (axis < 0)
          axis += operandSizes.size();

        Value constAxis = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(),
            rewriter.getIntegerAttr(rewriter.getIntegerType(64), axis));
        Value constKeepDims = rewriter.create<Torch::ConstantBoolOp>(
            binder.getLoc(), rewriter.getType<Torch::BoolType>(),
            rewriter.getBoolAttr(keepDims));

        if (selectLastIndex) {
          Value dims = createConstantIntList(binder, rewriter, {axis});
          auto operandTy = dyn_cast<Torch::ValueTensorType>(operand.getType());
          operand = rewriter.create<Torch::AtenFlipOp>(
              binder.getLoc(), operandTy, operand, dims);
          Value argmin = rewriter.create<Torch::AtenArgminOp>(
              binder.getLoc(), resultType, operand, constAxis, constKeepDims);
          Value offset = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(),
              rewriter.getI64IntegerAttr(operandSizes[axis] - 1));
          Value alpha = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(1));
          Value sub = rewriter.create<Torch::AtenSubScalarOp>(
              binder.getLoc(), resultType, argmin, offset, alpha);
          rewriter.replaceOpWithNewOp<Torch::AtenAbsOp>(binder.op, resultType,
                                                        sub);
          return success();
        }

        rewriter.replaceOpWithNewOp<Torch::AtenArgminOp>(
            binder.op, resultType, operand, constAxis, constKeepDims);
        return success();
      });
  patterns.onOp("Asin", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAsinOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Asinh", 9,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAsinhOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Atan", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAtanOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Atanh", 9,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAtanhOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Acos", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAcosOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Acosh", 9,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenAcoshOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp(
      "BatchNormalization", 15,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input, weight, bias, inputMean, inputVar;
        bool training;
        float momentum, eps;
        if (binder.tensorOperandAtIndex(input, 0) ||
            binder.tensorOperandAtIndex(weight, 1) ||
            binder.tensorOperandAtIndex(bias, 2) ||
            binder.tensorOperandAtIndex(inputMean, 3) ||
            binder.tensorOperandAtIndex(inputVar, 4) ||
            binder.f32FloatAttr(momentum, "momentum", 0.9f) ||
            binder.f32FloatAttr(eps, "epsilon", 1e-05f) ||
            binder.s64BoolAttr(training, "training_mode", 0) ||
            binder.tensorResultTypeAtIndex(resultType, 0))
          return failure();

        Location loc = binder.getLoc();
        Value cstFalse = rewriter.create<Torch::ConstantBoolOp>(loc, false);
        Value cstMomentum = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(momentum));
        Value cstEps = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(eps));

        // When training_mode=False, the op outputs only Y, where
        // Y = (X - input_mean) / sqrt(input_var + epsilon) * scale + B
        if (!training) {
          rewriter.replaceOpWithNewOp<Torch::AtenBatchNormOp>(
              binder.op, resultType, input, weight, bias, inputMean, inputVar,
              /*training=*/cstFalse, cstMomentum, cstEps,
              /*cudnn_enabled=*/cstFalse);
          return success();
        }

        Torch::ValueTensorType meanResultType, varResultType;
        if (binder.tensorResultTypeAtIndex(meanResultType, 1) ||
            binder.tensorResultTypeAtIndex(varResultType, 2))
          return failure();

        // When training_mode=True, the outputs are as follows:
        // Y, running_mean, running_var.
        // Y = (X - current_mean) / sqrt(current_var + epsilon) * scale + B
        // running_mean = input_mean * momentum + current_mean * (1 - momentum)
        // running_var = input_var * momentum + current_var * (1 - momentum)
        // and
        // current_mean = ReduceMean(X, axis=all_except_channel_index)
        // current_var = ReduceVar(X, axis=all_except_channel_index)
        Torch::ValueTensorType inputType =
            cast<Torch::ValueTensorType>(input.getType());
        if (!inputType.hasSizes())
          return rewriter.notifyMatchFailure(
              binder.op, "unimplemented: expected input to have sizes");

        // Computing current_mean and current_var.
        int64_t inputRank = inputType.getSizes().size();
        // Reduce all dimensions except channel dim.
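        // e.g. for an NCHW input (rank 4) the reduction dims are {0, 2, 3},
        // keeping only the channel dim 1.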
        SmallVector<Value> dimsToReduce;
        for (int64_t i = 0; i < inputRank; i++) {
          if (i != 1)
            dimsToReduce.push_back(rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        Value reduceDimsList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            dimsToReduce);
        Value noneVal = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        Value currentMean = rewriter.create<Torch::AtenMeanDimOp>(
            loc, meanResultType, input, reduceDimsList,
            /*keepdim=*/cstFalse,
            /*dtype=*/noneVal);
        Value currentVar = rewriter.create<Torch::AtenVarDimOp>(
            loc, varResultType, input, reduceDimsList,
            /*unbiased=*/cstFalse,
            /*keepdim=*/cstFalse);

        // Computing running_mean.
        Value inputMeanMulMomentum = rewriter.create<Torch::AtenMulScalarOp>(
            loc, meanResultType, inputMean, cstMomentum);
        Value currentMeanMulMomentum = rewriter.create<Torch::AtenMulScalarOp>(
            loc, varResultType, currentMean, cstMomentum);
        Value constantOne = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(1));
        Value inpMeanMMSubCurMeanMM = rewriter.create<Torch::AtenSubTensorOp>(
            loc, meanResultType, inputMeanMulMomentum, currentMeanMulMomentum,
            constantOne);
        Value runningMean = rewriter.create<Torch::AtenAddTensorOp>(
            loc, meanResultType, inpMeanMMSubCurMeanMM, currentMean,
            constantOne);

        // Computing running_var.
        Value inputVarMulMomentum = rewriter.create<Torch::AtenMulScalarOp>(
            loc, varResultType, inputVar, cstMomentum);
        Value currentVarMulMomentum = rewriter.create<Torch::AtenMulScalarOp>(
            loc, varResultType, currentVar, cstMomentum);
        Value inpVarMMSubCurVarMM = rewriter.create<Torch::AtenSubTensorOp>(
            loc, varResultType, inputVarMulMomentum, currentVarMulMomentum,
            constantOne);
        Value runningVar = rewriter.create<Torch::AtenAddTensorOp>(
            loc, varResultType, inpVarMMSubCurVarMM, currentVar, constantOne);

        // Computing Y.
        Value y = rewriter.create<Torch::AtenBatchNormOp>(
            loc, resultType, input, weight, bias, currentMean, currentVar,
            /*training=*/cstFalse, cstMomentum, cstEps,
            /*cudnn_enabled=*/cstFalse);

        rewriter.replaceOp(binder.op, {y, runningMean, runningVar});
        return success();
      });
  patterns.onOp(
      "AveragePool", 11,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        std::string autoPad;
        SmallVector<int64_t> dilations;
        if (binder.customOpNameStringAttr(autoPad, "auto_pad", "NOTSET"))
          return failure();
        if (autoPad != "NOTSET") {
          // TODO: Add support for `auto_pad` != "NOTSET"
          return rewriter.notifyMatchFailure(
              binder.op, "unsupported conversion: auto_pad != NOTSET");
        }

        Torch::ValueTensorType resultType;
        Value operand;
        bool ceilMode, countIncludePad;
        if (binder.tensorOperand(operand) ||
            binder.s64BoolAttr(ceilMode, "ceil_mode", false) ||
            binder.s64BoolAttr(countIncludePad, "count_include_pad", false) ||
            binder.tensorResultType(resultType))
          return failure();

        // Determine the rank of input tensor.
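        // Rank-3, rank-4 and rank-5 inputs map to avg_pool1d/2d/3d below.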
        std::optional<unsigned> maybeRank = Torch::getTensorRank(operand);
        if (!maybeRank)
          return rewriter.notifyMatchFailure(binder.op,
                                             "Unimplemented: unranked tensor");
        unsigned rank = *maybeRank;

        SmallVector<int64_t> kernel, padding, strides;
        if (binder.s64IntegerArrayAttr(kernel, "kernel_shape", {})) {
          return failure();
        }
        if (kernel.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "kernel list size does not match the number of axes");
        }
        SmallVector<int64_t> defaultPadding(2 * (rank - 2), 0);
        if (binder.s64IntegerArrayAttr(padding, "pads", defaultPadding)) {
          return failure();
        }
        if (padding.size() != 2 * (rank - 2)) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "padding list size does not match twice the number of axes");
        }
        if (binder.s64IntegerArrayAttr(
                strides, "strides", llvm::SmallVector<int64_t>(rank - 2, 1))) {
          return failure();
        }
        if (strides.size() != 1 && strides.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "strides list size does not match the number of axes");
        }

        SmallVector<Value> cstKernel, cstPadding, cstStridesDilations;
        for (int64_t i : kernel) {
          cstKernel.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        // Onnx pads format: [x1_begin, x2_begin…x1_end, x2_end,…]
        // Pytorch pads format: [x1, x2,...] or [x], assume begin==end for all
        // axes x.
        int64_t paddingSizeHalf = padding.size() / 2;
        for (int64_t i = 0; i < paddingSizeHalf; ++i) {
          // Check if onnx padding attribute is symmetric.
          if (padding[i] != padding[i + paddingSizeHalf])
            return rewriter.notifyMatchFailure(
                binder.op, "onnx padding attribute is not symmetric");
          cstPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(padding[i])));
        }
        for (int64_t i : strides) {
          cstStridesDilations.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }

        // No dilations attribute in pytorch avgpool op, so use this trick to
        // encode dilation into strides. Then in the following torchtolinalg
        // lowering, decode strides into strides + dilation.
        // [strideDim1,strideDim2,...,dilationDim1,dilationDim2,...]
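        // e.g. strides = {2, 2} and dilations = {1, 1} are encoded as the
        // single list {2, 2, 1, 1}.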
        if (binder.s64IntegerArrayAttr(
                dilations, "dilations",
                llvm::SmallVector<int64_t>(rank - 2, 1))) {
          return failure();
        }
        for (auto dilation : dilations) {
          cstStridesDilations.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(dilation)));
        }

        Value kernelSizeList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstKernel);
        Value paddingList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstPadding);
        Value stridesDilationsList =
            rewriter.create<Torch::PrimListConstructOp>(
                binder.getLoc(),
                Torch::ListType::get(
                    Torch::IntType::get(binder.op->getContext())),
                cstStridesDilations);
        Value cstCeilMode =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), ceilMode);
        Value cstCountIncludePad = rewriter.create<Torch::ConstantBoolOp>(
            binder.getLoc(), countIncludePad);
        Value cstNone = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());

        if (rank == 3) {
          rewriter.replaceOpWithNewOp<Torch::AtenAvgPool1dOp>(
              binder.op, resultType, operand, kernelSizeList,
              stridesDilationsList, paddingList, cstCeilMode,
              cstCountIncludePad);
          return success();
        } else if (rank == 4) {
          rewriter.replaceOpWithNewOp<Torch::AtenAvgPool2dOp>(
              binder.op, resultType, operand, kernelSizeList,
              stridesDilationsList, paddingList, cstCeilMode,
              cstCountIncludePad,
              /*divisor_override=*/cstNone);
          return success();
        } else if (rank == 5) {
          rewriter.replaceOpWithNewOp<Torch::AtenAvgPool3dOp>(
              binder.op, resultType, operand, kernelSizeList,
              stridesDilationsList, paddingList, cstCeilMode,
              cstCountIncludePad,
              /*divisor_override=*/cstNone);
          return success();
        }
        return failure();
      });
  patterns.onOp(
      "Bernoulli", 15,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input;
        int64_t dtypeIntOnnx;
        if (binder.tensorOperand(input) ||
            binder.s64IntegerAttr(dtypeIntOnnx, "dtype", -1) ||
            binder.tensorResultType(resultType))
          return failure();

        SmallString<64> name("torch.onnx.");
        name.append("seed");
        auto attr = binder.op->getAttr(name);
        if (attr) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "unimplemented: support not present for seed attribute");
        }

        Value none = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        Value bernoulli = rewriter.create<Torch::AtenBernoulliOp>(
            binder.getLoc(), input.getType(), input, /*generator=*/none);

        if (dtypeIntOnnx == -1) {
          // True, if dtype attribute value is not present.
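          // In that case the sampled tensor keeps the input's dtype and no
          // cast is needed.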
          rewriter.replaceOp(binder.op, bernoulli);
          return success();
        }
        std::optional<int64_t> dtypeIntTorch =
            onnxDtypeIntToTorchDtypeInt(dtypeIntOnnx);
        if (!dtypeIntTorch.has_value()) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "unimplemented support for the given dtype conversion");
        }
        Value constDtype = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(dtypeIntTorch.value()));
        Value cstFalse =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), false);
        rewriter.replaceOpWithNewOp<Torch::AtenToDtypeOp>(
            binder.op, resultType, bernoulli, constDtype,
            /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
            /*memory_format=*/none);
        return success();
      });
  patterns.onOp(
      "BitShift", 11,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value lhs, rhs;
        std::string direction;
        if (binder.tensorOperands(lhs, rhs) ||
            binder.tensorResultType(resultType) ||
            binder.customOpNameStringAttr(direction, "direction", ""))
          return failure();
        if (direction == "LEFT") {
          rewriter.replaceOpWithNewOp<Torch::AtenBitwiseLeftShiftTensorOp>(
              binder.op, resultType, lhs, rhs);
        } else {
          rewriter.replaceOpWithNewOp<Torch::AtenBitwiseRightShiftTensorOp>(
              binder.op, resultType, lhs, rhs);
        }
        return success();
      });
  patterns.onOp("BitwiseAnd", 18,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  std::string direction;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenBitwiseAndTensorOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp("BitwiseOr", 18,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  std::string direction;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenBitwiseOrTensorOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp("BitwiseNot", 18,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenBitwiseNotOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("BitwiseXor", 18,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  std::string direction;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenBitwiseXorTensorOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp(
      "Cast", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand;
        int64_t dtypeIntOnnx;
        if (binder.tensorOperand(operand) ||
            binder.s64IntegerAttr(dtypeIntOnnx, "to") ||
            binder.tensorResultType(resultType))
          return failure();

        std::optional<int64_t> dtypeIntTorch =
            onnxDtypeIntToTorchDtypeInt(dtypeIntOnnx);
        if (!dtypeIntTorch.has_value()) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "unimplemented support for the given dtype conversion");
        }
        Value constDtype = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(dtypeIntTorch.value()));
        Value none = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        Value cstFalse =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), false);
        rewriter.replaceOpWithNewOp<Torch::AtenToDtypeOp>(
            binder.op, resultType, operand, constDtype,
            /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
            /*memory_format=*/none);
        return success();
      });
  patterns.onOp(
      "CastLike", 15, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input, target;
        if (binder.tensorOperands(input, target) ||
            binder.tensorResultType(resultType))
          return failure();
        // TODO: Add support to handle the `saturate` attribute.
        // Ignoring it right now, since it's only used during the float8
        // conversions which are not supported in Torch-MLIR right now.

        Torch::ValueTensorType targetTy =
            cast<Torch::ValueTensorType>(target.getType());
        if (!targetTy.hasDtype()) {
          return rewriter.notifyMatchFailure(binder.op,
                                             "target tensor must have a dtype");
        }
        Type targetDtype = targetTy.getDtype();
        Value constDtype = Torch::getDtypeIntValueForType(
            rewriter, binder.getLoc(), targetDtype);
        Value none = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        Value cstFalse =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), false);
        rewriter.replaceOpWithNewOp<Torch::AtenToDtypeOp>(
            binder.op, resultType, input, constDtype,
            /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
            /*memory_format=*/none);
        return success();
      });
  patterns.onOp("Ceil", 13,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenCeilOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp(
      "Celu", 12, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand;
        float alpha;
        if (binder.tensorOperand(operand) ||
            binder.tensorResultType(resultType) ||
            binder.f32FloatAttr(alpha, "alpha", 1.0f))
          return failure();
        // exp(x/alpha)
        Value constAlpha = rewriter.create<Torch::ConstantFloatOp>(
            binder.getLoc(), rewriter.getType<Torch::FloatType>(),
            rewriter.getF64FloatAttr(alpha));
        Value xDivAlpha = rewriter.create<Torch::AtenDivScalarOp>(
            binder.getLoc(), resultType, operand, constAlpha);
        Value expXDivAlpha = rewriter.create<Torch::AtenExpOp>(
            binder.getLoc(), resultType, xDivAlpha);
        // alpha * (exp(x/alpha) - 1)
        Value constantOne = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(1));
        Value subOne = rewriter.create<Torch::AtenSubScalarOp>(
            binder.getLoc(), resultType, expXDivAlpha, constantOne,
            constantOne);
        Value mulAlpha = rewriter.create<Torch::AtenMulScalarOp>(
            binder.getLoc(), resultType, subOne, constAlpha);
        Value constantZero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));
        Value zeroTensor = createRank0Tensor(rewriter, binder.getLoc(),
                                             resultType, constantZero);
        // min(0, alpha * (exp(x/alpha) - 1))
        Value minExpression = rewriter.create<Torch::AtenMinimumOp>(
            binder.getLoc(), resultType, zeroTensor, mulAlpha);
        // max(0, x)
        Value maxExpression = rewriter.create<Torch::AtenMaximumOp>(
            binder.getLoc(), resultType, zeroTensor, operand);
        // max(0,x) + min(0, alpha * (exp(x/alpha) - 1))
        rewriter.replaceOpWithNewOp<Torch::AtenAddTensorOp>(
            binder.op, resultType, maxExpression, minExpression, constantOne);
        return success();
      });
  patterns.onOp(
      "CenterCropPad", 18,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input, shape;
        if (binder.tensorOperands(input, shape) ||
            binder.tensorResultType(resultType))
          return failure();

        auto inputTy = cast<Torch::ValueTensorType>(input.getType());
        SmallVector<int64_t> inputShape(inputTy.getSizes());
        SmallVector<int64_t> resultShape(resultType.getSizes());
        int64_t rank = inputShape.size();
        SmallVector<int64_t> axes, defaultAxes(rank);
        std::iota(defaultAxes.begin(), defaultAxes.end(), 0);
        if (binder.s64IntegerArrayAttr(axes, "axes", defaultAxes)) {
          return failure();
        }
        int64_t axesSize = axes.size();

        Value none = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        Value cstZero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));
        Value cstOne = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(1));
        Value cstTwo = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(2));
        auto scalarTensorType = rewriter.getType<Torch::ValueTensorType>(
            ArrayRef<int64_t>{}, rewriter.getIntegerType(64, /*signed*/ 1));
        auto selectTensorType = rewriter.getType<Torch::ValueTensorType>(
            ArrayRef<int64_t>{1}, rewriter.getIntegerType(64, /*signed*/ 1));

        int64_t lastChangeDim = 0;
        llvm::SmallVector<int64_t> interShape(inputShape);
        for (int i = 0; i < rank; i++) {
          if (inputShape[i] != resultShape[i]) {
            interShape[i] = -1;
            lastChangeDim = i;
          }
          if (interShape[i] == ShapedType::kDynamic)
            interShape[i] = Torch::kUnknownSize;
        }
        auto interType = rewriter.getType<Torch::ValueTensorType>(
            interShape, resultType.getOptionalDtype());

        Value modeVal = rewriter.create<Torch::ConstantStrOp>(
            binder.getLoc(), rewriter.getStringAttr("floor"));
        for (int i = 0; i < axesSize; i++) {
          if (axes[i] < 0)
            axes[i] += rank;
          if (inputShape[axes[i]] == resultShape[axes[i]])
            continue;
          auto opType = axes[i] == lastChangeDim ? resultType : interType;
          Value axis = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(axes[i]));
          Value k = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i));
          Value kTensor = rewriter.create<Torch::PrimNumToTensorScalarOp>(
              binder.getLoc(), scalarTensorType, k);
          Value sel = rewriter.create<Torch::AtenIndexSelectOp>(
              binder.getLoc(), selectTensorType, shape, cstZero, kTensor);
          Value outputDimSize = rewriter.create<Torch::AtenItemOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(), sel);
          Value inputDimSize = rewriter.create<Torch::AtenSizeIntOp>(
              binder.getLoc(), input,
              rewriter.create<Torch::ConstantIntOp>(
                  binder.getLoc(), rewriter.getI64IntegerAttr(axes[i])));

          if (inputShape[axes[i]] > resultShape[axes[i]]) {
            Value sub = rewriter.create<Torch::AtenSubIntOp>(
                binder.getLoc(), inputDimSize, outputDimSize);
            Value subTensor = rewriter.create<Torch::PrimNumToTensorScalarOp>(
                binder.getLoc(), scalarTensorType, sub);
            Value div = rewriter.create<Torch::AtenDivScalarModeOp>(
                binder.getLoc(), scalarTensorType, subTensor, cstTwo, modeVal);
            Value start = rewriter.create<Torch::AtenItemOp>(
                binder.getLoc(), rewriter.getType<Torch::IntType>(), div);
            Value end = rewriter.create<Torch::AtenAddIntOp>(
                binder.getLoc(), start, outputDimSize);
            input = rewriter.create<Torch::AtenSliceTensorOp>(
                binder.getLoc(), opType, input, axis, start, end, cstOne);
          } else {
            Value sub = rewriter.create<Torch::AtenSubIntOp>(
                binder.getLoc(), outputDimSize, inputDimSize);
            Value subTensor = rewriter.create<Torch::PrimNumToTensorScalarOp>(
                binder.getLoc(), scalarTensorType, sub);
            Value div = rewriter.create<Torch::AtenDivScalarModeOp>(
                binder.getLoc(), scalarTensorType, subTensor, cstTwo, modeVal);
            Value start = rewriter.create<Torch::AtenItemOp>(
                binder.getLoc(), rewriter.getType<Torch::IntType>(), div);
            Value end = rewriter.create<Torch::AtenAddIntOp>(
                binder.getLoc(), start, inputDimSize);

            SmallVector<Value> zerosShapeValues;
            for (int j = 0; j < rank; j++) {
              if (j == axes[i]) {
                zerosShapeValues.push_back(outputDimSize);
              } else {
                Value dimSize = rewriter.create<Torch::AtenSizeIntOp>(
                    binder.getLoc(), input,
                    rewriter.create<Torch::ConstantIntOp>(
                        binder.getLoc(), rewriter.getI64IntegerAttr(j)));
                zerosShapeValues.push_back(dimSize);
              }
            }
            Value zerosShapeList = rewriter.create<Torch::PrimListConstructOp>(
                binder.getLoc(),
                rewriter.getType<Torch::ListType>(
                    rewriter.getType<Torch::IntType>()),
                zerosShapeValues);
            Value zeros = rewriter.create<Torch::AtenZerosOp>(
                binder.getLoc(), opType, zerosShapeList, none, none, none,
                none);
            input = rewriter.create<Torch::AtenSliceScatterOp>(
                binder.getLoc(), opType, zeros, input, axis, start, end,
                cstOne);
          }
        }
        rewriter.replaceOp(binder.op, input);
        return success();
      });
  patterns.onOp(
      "Clip", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        // https://onnx.ai/onnx/operators/onnx__Clip.html
        // Inputs and outputs must be tensors.
        Value source;
        Torch::ValueTensorType resultType;
        if (binder.tensorOperandAtIndex(source, 0) ||
            binder.tensorResultType(resultType)) {
          return failure();
        }

        // Min and max can be args (version 11+) or attributes (version 6-).
        // They default to numeric_limits<float>::lowest() and
        // numeric_limits<float>::max().
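        // e.g. opset 6 carries min/max as float attributes, while opset 11+
        // passes them as optional tensor inputs; both forms are handled below.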
        Value min;
        Value max;
        if (binder.op->getNumOperands() >= 2)
          min = binder.op->getOperand(1);
        if (binder.op->getNumOperands() == 3)
          max = binder.op->getOperand(2);

        // Note: attribute versions of the op only support float types.
        auto resultDtype = resultType.getDtype();
        if (!min && binder.op->hasAttr("torch.onnx.min")) {
          float minValue;
          if (binder.f32FloatAttr(minValue, "min",
                                  std::numeric_limits<float>::lowest()))
            return failure();
          auto minSplatAttr = SplatElementsAttr::get(
              resultType.toBuiltinTensor(),
              rewriter.getFloatAttr(resultDtype, minValue));
          min = rewriter.create<Torch::ValueTensorLiteralOp>(
              binder.getLoc(), resultType, minSplatAttr);
        }
        if (!max && binder.op->hasAttr("torch.onnx.max")) {
          float maxValue;
          if (binder.f32FloatAttr(maxValue, "max",
                                  std::numeric_limits<float>::max()))
            return failure();
          auto maxSplatAttr = SplatElementsAttr::get(
              resultType.toBuiltinTensor(),
              rewriter.getFloatAttr(resultDtype, maxValue));
          max = rewriter.create<Torch::ValueTensorLiteralOp>(
              binder.getLoc(), resultType, maxSplatAttr);
        }

        if (!min && !max) {
          // Clipping with no limits is a no-op.
          rewriter.replaceOp(binder.op, source);
          return success();
        }

        if (!max) {
          rewriter.replaceOpWithNewOp<Torch::AtenClampMinTensorOp>(
              binder.op, resultType, source, min);
          return success();
        }

        rewriter.replaceOpWithNewOp<Torch::AtenClampTensorOp>(
            binder.op, resultType, source, min, max);
        return success();
      });
  patterns.onOp(
      "Compress", 9, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand, conditionTensor;
        int64_t axis;
        if (binder.tensorOperands(operand, conditionTensor) ||
            binder.s64IntegerAttr(axis, "axis", INT64_MAX) ||
            binder.tensorResultType(resultType))
          return failure();

        auto shapeSizes =
            dyn_cast<Torch::ValueTensorType>(operand.getType()).getSizes();
        auto resultSizes = resultType.getSizes();

        // flatten input tensor if using default axis
        if (axis == INT64_MAX) {
          SmallVector<int64_t> nonzeroShape = {resultSizes[0]};
          auto dtype =
              dyn_cast<Torch::ValueTensorType>(conditionTensor.getType())
                  .getDtype();
          auto nonzeroType =
              rewriter.getType<Torch::ValueTensorType>(nonzeroShape, dtype);
          Value indexVal = rewriter.create<Torch::AtenNonzeroOp>(
              binder.getLoc(), nonzeroType, conditionTensor);
          Value cstZero = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(0));
          Value cstNegOne = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(-1));
          int64_t numElements = 1;
          for (auto i : shapeSizes) {
            numElements *= i;
          }
          SmallVector<int64_t> flattenShape = {numElements};
          auto flattenType = rewriter.getType<Torch::ValueTensorType>(
              flattenShape, resultType.getDtype());
          Value flattenTensor = rewriter.create<Torch::AtenFlattenUsingIntsOp>(
              binder.getLoc(), flattenType, operand, cstZero, cstNegOne);
          rewriter.replaceOpWithNewOp<Torch::AtenIndexSelectOp>(
              binder.op, resultType, flattenTensor, cstZero, indexVal);
          return success();
        }

        // Negative axis value means counting dimensions from the back
        if (axis < 0)
          axis += shapeSizes.size();
        SmallVector<int64_t> nonzeroShape = {resultSizes[axis]};
        auto dtype = dyn_cast<Torch::ValueTensorType>(conditionTensor.getType())
                         .getDtype();
        auto nonzeroType =
            rewriter.getType<Torch::ValueTensorType>(nonzeroShape, dtype);
        Value indexVal = rewriter.create<Torch::AtenNonzeroOp>(
            binder.getLoc(), nonzeroType, conditionTensor);
        Value dimVal = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(axis));
        rewriter.replaceOpWithNewOp<Torch::AtenIndexSelectOp>(
            binder.op, resultType, operand, dimVal, indexVal);
        return success();
      });
  patterns.onOp(
      "Concat", 11, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        SmallVector<Value> tensors;
        int64_t dim;
        if (binder.tensorOperands(tensors, binder.op->getNumOperands()) ||
            binder.s64IntegerAttr(dim, "axis", 0) ||
            binder.tensorResultType(resultType))
          return failure();
        Type listElemType =
            cast<Torch::BaseTensorType>(tensors[0].getType())
                .getWithSizesAndDtype(/*optionalSizes=*/std::nullopt,
                                      /*optionalDtype=*/nullptr);
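        // The list element type drops sizes and dtype so that operands with
        // mismatched static shapes can share a single list type.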
        Type listType = Torch::ListType::get(listElemType);
        Value tensorList = rewriter.create<Torch::PrimListConstructOp>(
            binder.op->getLoc(), listType, tensors);
        Value cstDim = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(dim));
        rewriter.replaceOpWithNewOp<Torch::AtenCatOp>(binder.op, resultType,
                                                      tensorList, cstDim);
        return success();
      });
  patterns.onOp(
      "Constant", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        if (binder.tensorResultType(resultType))
          return failure();
        auto dtype = resultType.getDtype();

        float floatValue;
        if (binder.op->hasAttr("torch.onnx.value_float") &&
            !binder.f32FloatAttr(floatValue, "value_float", 0.0)) {
          auto splatAttr =
              SplatElementsAttr::get(resultType.toBuiltinTensor(),
                                     rewriter.getFloatAttr(dtype, floatValue));
          rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
              binder.op, resultType, splatAttr);
          return success();
        }

        int64_t intValue;
        if (binder.op->hasAttr("torch.onnx.value_int") &&
            !binder.s64IntegerAttr(intValue, "value_int", 0)) {
          auto splatAttr =
              SplatElementsAttr::get(resultType.toBuiltinTensor(),
                                     rewriter.getIntegerAttr(dtype, intValue));
          rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
              binder.op, resultType, splatAttr);
          return success();
        }

        if (DenseResourceElementsAttr attr =
                dyn_cast_or_null<DenseResourceElementsAttr>(
                    binder.op->getAttr("torch.onnx.value"))) {
          // Bytes are stored in little endian order. Big endian support will
          // require swizzling.
          if (!Endian::little) {
            binder.op->emitError(
                "unimplemented: importing on big endian systems");
            return failure();
          }

          auto ty = cast<ShapedType>(attr.getType());
          ElementsAttr denseAttr;
          auto ptr = attr.getRawHandle().getBlob();
          if (!ptr) {
            denseAttr = DenseResourceElementsAttr::get(
                ty, "__onnx_constant_not_found_possibly_due_to_being_elided__",
                AsmResourceBlob());
            rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
                binder.op, resultType, denseAttr);
            return success();
          }
          auto data = ptr->getData();
          if (cast<ShapedType>(attr.getType()).getElementType().isInteger(1)) {
            llvm::SmallVector<APInt> newContents;
            for (auto val : data) {
              APInt apval(1, val);
              newContents.push_back(apval);
            }
            denseAttr = DenseElementsAttr::get(ty, newContents);
          } else {
            denseAttr = DenseElementsAttr::getFromRawBuffer(ty, data);
          }
          rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
              binder.op, resultType, denseAttr);
          return success();
        }

        if (ElementsAttr attr = dyn_cast_or_null<ElementsAttr>(
                binder.op->getAttr("torch.onnx.value"))) {
          rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
              binder.op, resultType, attr);
          return success();
        }

        llvm::SmallVector<int64_t> intValues;
        if (!binder.s64IntegerArrayAttr(intValues, "value_ints", {}) &&
            !intValues.empty()) {
          llvm::SmallVector<APInt> apValues;
          for (auto intVal : intValues) {
            apValues.push_back(APInt(dtype.getIntOrFloatBitWidth(), intVal));
          }
          auto attr =
              DenseElementsAttr::get(resultType.toBuiltinTensor(), apValues);
          rewriter.replaceOpWithNewOp<Torch::ValueTensorLiteralOp>(
              binder.op, resultType, attr);
          return success();
        }

        return failure();
      });
  patterns.onOp(
      "Col2Im", 18, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input, blockShape, imageShape;
        SmallVector<int64_t> dilations, strides, pads;

        // TODO: The length of dilations should be len(imageShape), and the
        // same goes for strides. The length of pads should be 2 *
        // len(imageShape). But, as at the moment we are only supporting 3D or
        // 4D input, len(imageShape) must necessarily be 2, hence the lengths
        // of the default values.
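        // For reference, ONNX Col2Im takes an [N, C * prod(blockShape), L]
        // input; e.g. with imageShape = {5, 5} and blockShape = {2, 2}, the
        // columns are reassembled into an [N, C, 5, 5] image.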
        if (binder.tensorOperandAtIndex(input, 0) ||
            binder.tensorOperandAtIndex(imageShape, 1) ||
            binder.tensorOperandAtIndex(blockShape, 2) ||
            binder.tensorResultType(resultType) ||
            binder.s64IntegerArrayAttr(dilations, "dilations",
                                       SmallVector<int64_t>{1, 1}) ||
            binder.s64IntegerArrayAttr(strides, "strides",
                                       SmallVector<int64_t>{1, 1}) ||
            binder.s64IntegerArrayAttr(pads, "pads",
                                       SmallVector<int64_t>{0, 0, 0, 0}))
          return failure();

        auto imageShapeTy = cast<Torch::ValueTensorType>(imageShape.getType());
        auto imageShapeSizes = imageShapeTy.getSizes();

        auto blockShapeTy = cast<Torch::ValueTensorType>(blockShape.getType());
        auto blockShapeSizes = blockShapeTy.getSizes();

        // Check that neither imageShape nor blockShape have dynamic shapes.
        if (imageShapeSizes[0] == Torch::kUnknownSize ||
            blockShapeSizes[0] == Torch::kUnknownSize) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "Dynamic shapes are not allowed for imageShape and blockShape");
        }

        // TODO: Add support for 5D input tensors.
        if (imageShapeSizes[0] != 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected length of imageShape to be equal to 2");
        }
        if (blockShapeSizes[0] != 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected length of blockShape to be equal to 2");
        }
        if (dilations.size() != 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected length of dilations to be equal to 2");
        }
        if (strides.size() != 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected length of strides to be equal to 2");
        }

        // TODO: Disable this check and add support for different
        // paddings on lower and higher ends of each axis.
        // Because we have already checked that imageShape has 2 elements,
        // we can safely assume that len(padding) will be 4.
        if (pads[0] != pads[2] || pads[1] != pads[3])
          return rewriter.notifyMatchFailure(
              binder.op, "padding on the lower end and the higher end "
                         "on each axis should be the same");

        // Since we know that the padding on the lower end and the higher
        // end on each axis is the same, we can reduce the size of the
        // padding list, and filter out the duplicate elements.
        // (Also, Torch::AtenCol2imOp requires len(padding) to be 2).
        SmallVector<int64_t> padOnEachAxis = {pads[0], pads[1]};
        Value dilationsList =
            createConstantIntList(binder, rewriter, dilations);
        Value stridesList = createConstantIntList(binder, rewriter, strides);
        Value paddingList =
            createConstantIntList(binder, rewriter, padOnEachAxis);
        Value zero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));

        // Index the imageShape and blockShape tensors, as AtenCol2imOp
        // expects them to be int lists.
        auto select = [&](Value v, Value k,
                          Torch::ValueTensorType ty) -> Value {
          Value kTensor = rewriter.create<Torch::PrimNumToTensorScalarOp>(
              binder.getLoc(),
              Torch::ValueTensorType::get(
                  binder.op->getContext(), ArrayRef<int64_t>{1},
                  rewriter.getIntegerType(64, /*signed*/ 1)),
              k);
          auto sel = rewriter.create<Torch::AtenIndexSelectOp>(
              binder.getLoc(),
              Torch::ValueTensorType::get(ty.getContext(),
                                          ArrayRef<int64_t>{1},
                                          ty.getOptionalDtype()),
              v, zero, kTensor);
          Value item = rewriter.create<Torch::AtenItemOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(), sel);
          return item;
        };

        SmallVector<Value> imageShapeContainer, blockShapeContainer;
        for (int64_t i = 0; i < imageShapeSizes[0]; ++i) {
          Value k = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i));

          // Passing in the shapeType of each of these tensors avoids
          // repeated casts, as these have already been calculated.
          imageShapeContainer.push_back(select(imageShape, k, imageShapeTy));
          blockShapeContainer.push_back(select(blockShape, k, blockShapeTy));
        }

        Value imageShapeAsList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            imageShapeContainer);
        Value blockShapeAsList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            blockShapeContainer);

        rewriter.replaceOpWithNewOp<Torch::AtenCol2imOp>(
            binder.op, resultType, input, imageShapeAsList, blockShapeAsList,
            dilationsList, paddingList, stridesList);
        return success();
      });
  patterns.onOp(
      "Conv", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        std::string autoPad;
        if (binder.customOpNameStringAttr(autoPad, "auto_pad", "NOTSET"))
          return failure();
        if (autoPad != "NOTSET") {
          // TODO: Add support for `auto_pad` != "NOTSET"
          return rewriter.notifyMatchFailure(
              binder.op, "unsupported conversion: auto_pad != NOTSET");
        }

        Torch::ValueTensorType resultType;
        Value input, weight;
        int64_t group;
        if (binder.tensorOperandAtIndex(input, 0) ||
            binder.tensorOperandAtIndex(weight, 1) ||
            binder.s64IntegerAttr(group, "group", 1) ||
            binder.tensorResultType(resultType))
          return failure();

        auto weightTensorType = cast<Torch::ValueTensorType>(weight.getType());
        if (!weightTensorType || !weightTensorType.hasSizes()) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected weight type having sizes");
        }
        ArrayRef<int64_t> weightShape = weightTensorType.getSizes();
        SmallVector<int64_t> kernelShape;
        if (binder.s64IntegerArrayAttr(kernelShape, "kernel_shape", {}))
          return failure();
        if (kernelShape.size()) {
          if (kernelShape.size() != weightShape.size() - 2) {
            return rewriter.notifyMatchFailure(
                binder.op,
                "unsupported conversion: kernel_shape list size should have "
                "number of values equal to weight_rank - 2");
          } else {
            for (unsigned i = 0; i < kernelShape.size(); i++) {
              if (weightShape[i + 2] != kernelShape[i]) {
                return rewriter.notifyMatchFailure(
                    binder.op, "unsupported conversion: kernel_shape value "
                               "should be equal to the weight tensor shape");
              }
            }
          }
        }

        // Determine the rank of input tensor.
        std::optional<unsigned> maybeRank = Torch::getTensorRank(input);
        if (!maybeRank)
          return rewriter.notifyMatchFailure(binder.op,
                                             "Unimplemented: unranked tensor");
        unsigned rank = *maybeRank;

        SmallVector<int64_t> padding, strides, dilations;
        SmallVector<int64_t> defaultPadding, defaultStrides, defaultDilations;
        for (unsigned i = 0; i < rank - 2; i++) {
          defaultPadding.push_back(0);
          defaultStrides.push_back(1);
          defaultDilations.push_back(1);
        }
        // Padding for the beginning and ending along each spatial axis; it
        // can take any value greater than or equal to 0. The value represents
        // the number of pixels added to the beginning and end part of the
        // corresponding axis. The pads format should be as follows:
        // [x1_begin, x2_begin…x1_end, x2_end,…], where xi_begin is the number
        // of pixels added at the beginning of axis i and xi_end is the number
        // of pixels added at the end of axis i.
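        // e.g. for Conv2d (spatial axes H, W), pads = {1, 2, 1, 2} adds one
        // row at the top and bottom and two columns at the left and right.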
        if (binder.s64IntegerArrayAttr(padding, "pads", defaultPadding)) {
          return failure();
        }
        if (padding.size() != rank - 2 && padding.size() != 2 * (rank - 2)) {
          return rewriter.notifyMatchFailure(
              binder.op, "padding list size does not match the number of axes");
        }
        if (binder.s64IntegerArrayAttr(dilations, "dilations",
                                       defaultDilations)) {
          return failure();
        }
        if (dilations.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "dilations list size does not match the number of axes");
        }
        if (binder.s64IntegerArrayAttr(strides, "strides", defaultStrides)) {
          return failure();
        }
        if (strides.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "strides list size does not match the number of axes");
        }

        SmallVector<Value> cstPadding, cstStrides, cstDilations,
            cstOutputPadding;
        Value paddedInput = input;
        Value paddingList;
        if (padding.size() != 2 * (rank - 2)) {
          for (int64_t i : padding) {
            cstPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(i)));
          }
          paddingList = rewriter.create<Torch::PrimListConstructOp>(
              binder.getLoc(),
              Torch::ListType::get(
                  Torch::IntType::get(binder.op->getContext())),
              cstPadding);
        } else {
          // ONNX offers pads in the format listing all starting dims, then all
          // ending dims, e.g. {t, l, b, r} for conv2d. Torch by default
          // accepts only starting dims, e.g. {t, l}. However, we can support
          // padding at the beginning and end of each dimension by first
          // performing torch.nn.functional.pad on the input. But this requires
          // the pad values to be rearranged since torch pad() takes pads in
          // the order rightmost dim start and end, then next to last, and so
          // on, e.g. {l, r, t, b}.
          bool matchedPads = true;
          for (unsigned i = 0; i < padding.size() / 2; i++) {
            if (padding[i] != padding[i + (padding.size() / 2)]) {
              matchedPads = false;
              break;
            }
          }
          if (matchedPads) {
            for (unsigned i = 0; i < padding.size() / 2; i++) {
              cstPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
                  binder.getLoc(), rewriter.getI64IntegerAttr(padding[i])));
            }
            paddingList = rewriter.create<Torch::PrimListConstructOp>(
                binder.getLoc(),
                Torch::ListType::get(
                    Torch::IntType::get(binder.op->getContext())),
                cstPadding);
          } else {
            SmallVector<Value> padsRearrange;
            SmallVector<Value> inputPaddingList;
            for (uint32_t i = 0; i < padding.size() / 2; i++) {
              padsRearrange.emplace_back(rewriter.create<Torch::ConstantIntOp>(
                  binder.getLoc(),
                  rewriter.getI64IntegerAttr(
                      padding[padding.size() / 2 - i - 1])));
              padsRearrange.emplace_back(rewriter.create<Torch::ConstantIntOp>(
                  binder.getLoc(),
                  rewriter.getI64IntegerAttr(padding[padding.size() - i - 1])));
              inputPaddingList.emplace_back(
                  rewriter.create<Torch::ConstantIntOp>(
                      binder.getLoc(), rewriter.getI64IntegerAttr(0)));
            }
            // The conv op itself will have no padding since the actual
            // padding is performed using the torch.pad preceding it.
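            // e.g. ONNX pads {t, l, b, r} = {1, 2, 3, 4} becomes the torch
            // pad list {l, r, t, b} = {2, 4, 1, 3}.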
            paddingList = rewriter.create<Torch::PrimListConstructOp>(
                binder.getLoc(),
                Torch::ListType::get(
                    Torch::IntType::get(binder.op->getContext())),
                inputPaddingList);
            Value padsSizeList =
                rewriter
                    .create<Torch::PrimListConstructOp>(
                        binder.getLoc(),
                        Torch::ListType::get(
                            rewriter.getType<Torch::IntType>()),
                        padsRearrange)
                    .getResult();
            Value modeVal = rewriter.create<Torch::ConstantStrOp>(
                binder.getLoc(), rewriter.getStringAttr("constant"));
            Value constantValue;
            auto inputTensorType =
                cast<Torch::ValueTensorType>(input.getType());
            if (isa<IntegerType>(inputTensorType.getDtype()))
              constantValue = rewriter.create<Torch::ConstantIntOp>(
                  binder.getLoc(), rewriter.getI64IntegerAttr(0));
            if (isa<FloatType>(inputTensorType.getDtype()))
              constantValue = rewriter.create<Torch::ConstantFloatOp>(
                  binder.getLoc(), rewriter.getF64FloatAttr(0.0f));
            // Pad output shape must be computed explicitly from the pad values
            SmallVector<int64_t> newInputShape(inputTensorType.getSizes());
            for (uint32_t i = 0; i < padding.size() / 2; i++) {
              newInputShape[2 + i] +=
                  padding[i] + padding[(padding.size() / 2) + i];
            }
            auto padTy = rewriter.getType<Torch::ValueTensorType>(
                newInputShape, inputTensorType.getDtype());
            paddedInput = rewriter.create<Torch::AtenPadOp>(
                binder.getLoc(), padTy, input, padsSizeList, modeVal,
                constantValue);
          }
        }
        for (int64_t i : dilations) {
          cstDilations.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        for (int64_t i : strides) {
          cstStrides.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        Value cstZero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));
        cstOutputPadding = {cstZero, cstZero};

        Value dilationsList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstDilations);
        Value stridesList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstStrides);
        Value outputPaddingList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstOutputPadding);
        Value transposed =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), false);
        Value bias;
        if (binder.op->getNumOperands() == 3) {
          if (binder.tensorOperandAtIndex(bias, 2)) {
            return failure();
          }
        } else {
          bias = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        }
        Value cstGroup = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(group));

        rewriter.replaceOpWithNewOp<Torch::AtenConvolutionOp>(
            binder.op, resultType, paddedInput, weight, bias, stridesList,
            paddingList, dilationsList, transposed, outputPaddingList,
            cstGroup);
        return success();
      });
  patterns.onOp(
      "ConvInteger", 10,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        std::string autoPad;
        if (binder.customOpNameStringAttr(autoPad, "auto_pad", "NOTSET"))
          return failure();
        if (autoPad != "NOTSET")
          // TODO: Add support for `auto_pad` != "NOTSET"
          return rewriter.notifyMatchFailure(
              binder.op, "unsupported conversion: auto_pad != NOTSET");

        Torch::ValueTensorType resultType;
        Value input, weight, inputZp, weightZp;
        int64_t group;
        if (binder.tensorOperandAtIndex(input, 0) ||
            binder.tensorOperandAtIndex(weight, 1) ||
            binder.s64IntegerAttr(group, "group", 1) ||
            binder.tensorResultType(resultType))
          return failure();

        auto inputTy = dyn_cast<Torch::ValueTensorType>(input.getType());
        auto weightTy = dyn_cast<Torch::ValueTensorType>(weight.getType());
        if (!weightTy || !weightTy.hasSizes())
          return rewriter.notifyMatchFailure(
              binder.op, "Expected weight type having sizes");
        ArrayRef<int64_t> weightShape = weightTy.getSizes();
        SmallVector<int64_t> kernelShape;
        if (binder.s64IntegerArrayAttr(kernelShape, "kernel_shape", {}))
          return failure();
        if (kernelShape.size()) {
          if (kernelShape.size() != weightShape.size() - 2) {
            return rewriter.notifyMatchFailure(
                binder.op,
                "unsupported conversion: kernel_shape list size should have "
                "number of values equal to weight_rank - 2");
" "number of values equal to weight_rank - 2"); } else { for (unsigned i = 0; i < kernelShape.size(); i++) { if (weightShape[i + 2] != kernelShape[i]) return rewriter.notifyMatchFailure( binder.op, "unsupported conversion: kernel_shape value " "should be equal to the weight tensor shape"); } } } // Determine the rank of input tensor. std::optional maybeRank = Torch::getTensorRank(input); if (!maybeRank) return rewriter.notifyMatchFailure(binder.op, "Unimplemented: unranked tensor"); unsigned rank = *maybeRank; SmallVector padding, strides, dilations; SmallVector defaultPadding(rank - 2, 0), defaultStrides(rank - 2, 1), defaultDilations(rank - 2, 1); // Padding for the beginning and ending along each spatial axis, it can // take any value greater than or equal to 0. The value represent the // number of pixels added to the beginning and end part of the // corresponding axis. pads format should be as follow [x1_begin, // x2_begin…x1_end, x2_end,…], where xi_begin the number of pixels added // at the beginning of axis i and xi_end, the number of pixels added at // the end of axis i. if (binder.s64IntegerArrayAttr(padding, "pads", defaultPadding)) return failure(); if (padding.size() != rank - 2 && padding.size() != 2 * (rank - 2)) return rewriter.notifyMatchFailure( binder.op, "padding list size does not match the number of axes"); if (binder.s64IntegerArrayAttr(dilations, "dilations", defaultDilations)) return failure(); if (dilations.size() != rank - 2) return rewriter.notifyMatchFailure( binder.op, "dilations list size does not match the number of axes"); if (binder.s64IntegerArrayAttr(strides, "strides", defaultStrides)) return failure(); if (strides.size() != rank - 2) return rewriter.notifyMatchFailure( binder.op, "strides list size does not match the number of axes"); Value scale = rewriter.create( binder.getLoc(), rewriter.getType(), rewriter.getF64FloatAttr(1.0)); if (binder.tensorOperandAtIndex(inputZp, 2)) { inputZp = rewriter.create( binder.getLoc(), rewriter.getI64IntegerAttr(0)); } else { inputZp = rewriter.create( binder.getLoc(), rewriter.getType(), inputZp); } if (binder.tensorOperandAtIndex(weightZp, 3)) weightZp = rewriter.create( binder.getLoc(), rewriter.getI64IntegerAttr(0)); // TODO: support per channel quantization if weightZp is a 1-D tensor if (auto zpTy = dyn_cast(weightZp.getType())) { for (auto dim : zpTy.getSizes()) if (dim != 1) return failure(); weightZp = rewriter.create( binder.getLoc(), rewriter.getType(), weightZp); } SmallVector cstPadding; if (padding.size() != 2 * (rank - 2)) { for (int64_t i : padding) { cstPadding.push_back(rewriter.create( binder.getLoc(), rewriter.getI64IntegerAttr(i))); } } else { for (unsigned i = 0; i < padding.size() / 2; i++) { if (padding[i] != padding[i + (padding.size() / 2)]) // TODO: Add support for different padding values for the // beginning and ending along each spatial axis return rewriter.notifyMatchFailure( binder.op, "unsupported conversion: padding values for the beginning " "and ending along each spatial axis must be equal"); cstPadding.push_back(rewriter.create( binder.getLoc(), rewriter.getI64IntegerAttr(padding[i]))); } } Value paddingList = rewriter.create( binder.getLoc(), rewriter.getType( rewriter.getType()), cstPadding); Value dilationsList = createConstantIntList(binder, rewriter, dilations); Value stridesList = createConstantIntList(binder, rewriter, strides); Value outputPaddingList = createConstantIntList(binder, rewriter, {0, 0}); Value transposed = rewriter.create(binder.getLoc(), false); Value bias = 
        Value cstGroup = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(group));

        Type inputQTy = getQTorchTypeFromTorchIntType(inputTy);
        Type weightQTy = getQTorchTypeFromTorchIntType(weightTy);
        input = rewriter.create<Torch::Aten_MakePerTensorQuantizedTensorOp>(
            binder.getLoc(), inputQTy, input, scale, inputZp);
        weight = rewriter.create<Torch::Aten_MakePerTensorQuantizedTensorOp>(
            binder.getLoc(), weightQTy, weight, scale, weightZp);

        rewriter.replaceOpWithNewOp<Torch::AtenConvolutionOp>(
            binder.op, resultType, input, weight, bias, stridesList,
            paddingList, dilationsList, transposed, outputPaddingList,
            cstGroup);
        return success();
      });
  patterns.onOp(
      "ConvTranspose", 11,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        std::string autoPad;
        if (binder.customOpNameStringAttr(autoPad, "auto_pad", "NOTSET"))
          return failure();
        if (autoPad != "NOTSET") {
          // TODO: Add support for `auto_pad` != "NOTSET"
          return rewriter.notifyMatchFailure(
              binder.op, "unsupported conversion: auto_pad != NOTSET");
        }
        SmallVector<int64_t> outputShape;
        if (binder.s64IntegerArrayAttr(outputShape, "output_shape", {}))
          return failure();
        if (outputShape.size()) {
          // TODO: Add support for non-None output_shape value.
          return rewriter.notifyMatchFailure(
              binder.op,
              "unsupported conversion: output_shape should be absent");
        }
        Torch::ValueTensorType resultType;
        Value input, weight;
        int64_t group;
        if (binder.tensorOperandAtIndex(input, 0) ||
            binder.tensorOperandAtIndex(weight, 1) ||
            binder.s64IntegerAttr(group, "group", 1) ||
            binder.tensorResultType(resultType))
          return failure();

        auto weightTensorType = cast<Torch::ValueTensorType>(weight.getType());
        if (!weightTensorType || !weightTensorType.hasSizes()) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected weight type having sizes");
        }
        ArrayRef<int64_t> weightShape = weightTensorType.getSizes();
        SmallVector<int64_t> kernelShape;
        if (binder.s64IntegerArrayAttr(kernelShape, "kernel_shape", {}))
          return failure();
        if (kernelShape.size()) {
          if (kernelShape.size() != weightShape.size() - 2) {
            return rewriter.notifyMatchFailure(
                binder.op,
                "unsupported conversion: kernel_shape list size should have "
                "number of values equal to weight_rank - 2");
          } else {
            for (unsigned i = 0; i < kernelShape.size(); i++) {
              if (weightShape[i + 2] != kernelShape[i]) {
                return rewriter.notifyMatchFailure(
                    binder.op, "unsupported conversion: kernel_shape value "
                               "should be equal to the weight tensor shape");
              }
            }
          }
        }

        // Determine the rank of input tensor.
        std::optional<unsigned> maybeRank = Torch::getTensorRank(input);
        if (!maybeRank)
          return rewriter.notifyMatchFailure(binder.op,
                                             "Unimplemented: unranked tensor");
        unsigned rank = *maybeRank;

        SmallVector<int64_t> padding, strides, dilations, outputPadding;
        SmallVector<int64_t> defaultPadding, defaultStrides, defaultDilations,
            defaultOutputPadding;
        for (unsigned i = 0; i < rank - 2; i++) {
          defaultPadding.push_back(0);
          defaultStrides.push_back(1);
          defaultDilations.push_back(1);
          defaultOutputPadding.push_back(0);
        }
        // Padding for the beginning and ending along each spatial axis; it
        // can take any value greater than or equal to 0. The value represents
        // the number of pixels added to the beginning and end part of the
        // corresponding axis. The pads format should be as follows:
        // [x1_begin, x2_begin…x1_end, x2_end,…], where xi_begin is the number
        // of pixels added at the beginning of axis i and xi_end is the number
        // of pixels added at the end of axis i.
        if (binder.s64IntegerArrayAttr(padding, "pads", defaultPadding)) {
          return failure();
        }
        if (padding.size() != rank - 2 && padding.size() != 2 * (rank - 2)) {
          return rewriter.notifyMatchFailure(
              binder.op, "padding list size does not match the number of axes");
        }
        if (binder.s64IntegerArrayAttr(dilations, "dilations",
                                       defaultDilations)) {
          return failure();
        }
        if (dilations.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "dilations list size does not match the number of axes");
        }
        if (binder.s64IntegerArrayAttr(strides, "strides", defaultStrides)) {
          return failure();
        }
        if (strides.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op, "strides list size does not match the number of axes");
        }
        if (binder.s64IntegerArrayAttr(outputPadding, "output_padding",
                                       defaultOutputPadding)) {
          return failure();
        }
        if (outputPadding.size() != rank - 2) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "output_padding list size does not match the number of axes");
        }

        SmallVector<Value> cstPadding, cstStrides, cstDilations,
            cstOutputPadding;
        if (padding.size() != 2 * (rank - 2)) {
          for (int64_t i : padding) {
            cstPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(i)));
          }
        } else {
          for (unsigned i = 0; i < padding.size() / 2; i++) {
            if (padding[i] != padding[i + (padding.size() / 2)]) {
              // TODO: Add support for different padding values for the
              // beginning and ending along each spatial axis
              return rewriter.notifyMatchFailure(
                  binder.op,
                  "unsupported conversion: padding values for the beginning "
                  "and ending along each spatial axis must be equal");
            }
            cstPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(padding[i])));
          }
        }
        for (int64_t i : dilations) {
          cstDilations.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        for (int64_t i : strides) {
          cstStrides.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }
        for (int64_t i : outputPadding) {
          cstOutputPadding.push_back(rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(i)));
        }

        Value paddingList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstPadding);
        Value dilationsList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstDilations);
        Value stridesList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstStrides);
        Value outputPaddingList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(binder.op->getContext())),
            cstOutputPadding);
        Value transposed =
            rewriter.create<Torch::ConstantBoolOp>(binder.getLoc(), true);
        Value bias;
        if (binder.op->getNumOperands() == 3) {
          if (binder.tensorOperandAtIndex(bias, 2)) {
            return failure();
          }
        } else {
          bias = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        }
        Value cstGroup = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(group));

        rewriter.replaceOpWithNewOp<Torch::AtenConvolutionOp>(
            binder.op, resultType, input, weight, bias, stridesList,
            paddingList, dilationsList, transposed, outputPaddingList,
            cstGroup);
        return success();
      });
  patterns.onOp("Cos", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenCosOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp(
      "CumSum", 11, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand, axisTensor;
        int64_t exclusive, reverse;
        if (binder.tensorOperands(operand, axisTensor) ||
            binder.s64IntegerAttr(exclusive, "exclusive", 0) ||
            binder.s64IntegerAttr(reverse, "reverse", 0) ||
            binder.tensorResultType(resultType))
          return failure();

        Torch::BaseTensorType resultTensorType =
            cast<Torch::BaseTensorType>(resultType);
        if (!resultTensorType.hasDtype()) {
          return rewriter.notifyMatchFailure(
              binder.op, "expected result type to have a dtype");
        }

        // Deal with a negative axis: if (axis < 0) axis += rank.
        int64_t rank =
            cast<Torch::ValueTensorType>(operand.getType()).getSizes().size();
        Value rankVal = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(),
            rewriter.getIntegerAttr(rewriter.getIntegerType(64), rank));
        Value cstZero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));
        Value cstOne = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(1));

        Value axisScalar = rewriter.create<Torch::AtenItemOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(), axisTensor);
        Value isNegative = rewriter.create<Torch::AtenLtIntOp>(
            binder.getLoc(), axisScalar, cstZero);
        isNegative =
            rewriter.create<Torch::AtenIntBoolOp>(binder.getLoc(), isNegative);
        Value finalOffset = rewriter.create<Torch::AtenMulIntOp>(
            binder.getLoc(), isNegative, rankVal);
        Value axis = rewriter.create<Torch::AtenAddIntOp>(
            binder.getLoc(), axisScalar, finalOffset);
        Value none = rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());

        Value res;
        if (reverse) {
          Value dims = rewriter.create<Torch::PrimListConstructOp>(
              binder.getLoc(),
              rewriter.getType<Torch::ListType>(
                  rewriter.getType<Torch::IntType>()),
              SmallVector<Value>{axis});
          Value flip = rewriter.create<Torch::AtenFlipOp>(
              binder.getLoc(), resultType, operand, dims);
          Value cumsum = rewriter.create<Torch::AtenCumsumOp>(
              binder.getLoc(), resultType, flip, axis, none);
          res = rewriter.create<Torch::AtenFlipOp>(binder.getLoc(), resultType,
                                                   cumsum, dims);
        } else {
          res = rewriter.create<Torch::AtenCumsumOp>(
              binder.getLoc(), resultType, operand, axis, none);
        }

        if (exclusive)
          res = rewriter.create<Torch::AtenSubTensorOp>(
              binder.getLoc(), resultType, res, operand, cstOne);
        rewriter.replaceOp(binder.op, res);
        return success();
      });
  patterns.onOp(
      "DepthToSpace", 1,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input;
        int64_t blockSize;
        std::string mode;
        if (binder.tensorOperand(input) ||
            binder.s64IntegerAttr(blockSize, "blocksize") ||
            binder.customOpNameStringAttr(mode, "mode", "DCR") ||
            binder.tensorResultType(resultType))
          return failure();
        auto inputTy = dyn_cast<Torch::BaseTensorType>(input.getType());
        if (!inputTy || !inputTy.hasSizes()) {
          return rewriter.notifyMatchFailure(
              binder.op, "Expected input type having sizes");
        }
        SmallVector<int64_t> inputSizes{inputTy.getSizes()};
        if (inputSizes.size() != 4) {
          return rewriter.notifyMatchFailure(binder.op,
                                             "Expected input rank to be 4");
        }

        Value b = rewriter.create<Torch::AtenSizeIntOp>(
            binder.getLoc(), input,
            rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(0)));
        Value c = rewriter.create<Torch::AtenSizeIntOp>(
            binder.getLoc(), input,
            rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(1)));
        Value h = rewriter.create<Torch::AtenSizeIntOp>(
            binder.getLoc(), input,
            rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(2)));
        Value w = rewriter.create<Torch::AtenSizeIntOp>(
            binder.getLoc(), input,
            rewriter.create<Torch::ConstantIntOp>(
                binder.getLoc(), rewriter.getI64IntegerAttr(3)));
        Value cstBlockSize = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(blockSize));
        Value cstBlockSizeSquare = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(),
            rewriter.getI64IntegerAttr(blockSize * blockSize));
        Value cDivBlockSizeSquare = rewriter.create<Torch::AtenDivIntOp>(
            binder.getLoc(), c, cstBlockSizeSquare);
        cDivBlockSizeSquare = rewriter.create<Torch::AtenIntFloatOp>(
            binder.getLoc(), cDivBlockSizeSquare);
        Value reshapeSizesList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(input.getContext())),
            llvm::SmallVector<Value>{b, cstBlockSize, cstBlockSize,
                                     cDivBlockSizeSquare, h, w});
        int64_t cDivBlockSizeSquareInt =
            inputSizes[1] == Torch::kUnknownSize
                ? Torch::kUnknownSize
                : inputSizes[1] / (blockSize * blockSize);
        SmallVector<int64_t> reshapeSizesInt{
            inputSizes[0],          blockSize,     blockSize,
            cDivBlockSizeSquareInt, inputSizes[2], inputSizes[3]};
        Value reshapedInput = rewriter.create<Torch::AtenReshapeOp>(
            binder.getLoc(),
            inputTy.getWithSizesAndDtype(reshapeSizesInt,
                                         inputTy.getOptionalDtype()),
            input, reshapeSizesList);

        Value transposedInput;
        if (mode == "DCR") {
          if (failed(createTorchTransposeOp(
                  rewriter, binder.getLoc(), reshapedInput,
                  /*dimA=*/1, /*dimB=*/3, transposedInput)))
            return rewriter.notifyMatchFailure(
                binder.op, "Failed to create TorchTranspose op");
          if (failed(createTorchTransposeOp(
                  rewriter, binder.getLoc(), transposedInput,
                  /*dimA=*/2, /*dimB=*/4, transposedInput)))
            return rewriter.notifyMatchFailure(
                binder.op, "Failed to create TorchTranspose op");
        } else {
          // mode == "CRD"
          if (failed(createTorchTransposeOp(
                  rewriter, binder.getLoc(), reshapedInput,
                  /*dimA=*/2, /*dimB=*/4, transposedInput)))
            return rewriter.notifyMatchFailure(
                binder.op, "Failed to create TorchTranspose op");
          if (failed(createTorchTransposeOp(
                  rewriter, binder.getLoc(), transposedInput,
                  /*dimA=*/3, /*dimB=*/4, transposedInput)))
            return rewriter.notifyMatchFailure(
                binder.op, "Failed to create TorchTranspose op");
        }
        if (failed(createTorchTransposeOp(
                rewriter, binder.getLoc(), transposedInput,
                /*dimA=*/4, /*dimB=*/5, transposedInput)))
          return rewriter.notifyMatchFailure(
              binder.op, "Failed to create TorchTranspose op");

        Value hMulBlockSize = rewriter.create<Torch::AtenMulIntOp>(
            binder.getLoc(), h, cstBlockSize);
        Value wMulBlockSize = rewriter.create<Torch::AtenMulIntOp>(
            binder.getLoc(), w, cstBlockSize);
        reshapeSizesList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(Torch::IntType::get(input.getContext())),
            llvm::SmallVector<Value>{b, cDivBlockSizeSquare, hMulBlockSize,
                                     wMulBlockSize});
        rewriter.replaceOpWithNewOp<Torch::AtenReshapeOp>(
            binder.op, resultType, transposedInput, reshapeSizesList);
        return success();
      });
  patterns.onOp(
      "DeformConv", 19,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        auto loc = binder.getLoc();

        // get operands
        llvm::SmallVector<Value> operands;
        Torch::ValueTensorType resultType;
        if (binder.tensorOperandsList(operands) ||
            binder.tensorResultType(resultType))
          return failure();
        if (operands.size() < 3 || operands.size() > 5)
          return failure();
        auto inputType =
            dyn_cast<Torch::ValueTensorType>(operands[0].getType());
        if (!inputType || !inputType.hasSizes() ||
            inputType.getSizes().size() != 4)
          return rewriter.notifyMatchFailure(
              binder.op, "Unsupported: DeformConv with input rank != 4");
        unsigned rank = inputType.getSizes().size();
        auto weightType =
            dyn_cast<Torch::ValueTensorType>(operands[1].getType());
        if (!weightType || !weightType.hasSizes())
          return failure();
        auto offsetType =
            dyn_cast<Torch::ValueTensorType>(operands[2].getType());
        if (!offsetType || !offsetType.hasSizes())
          return failure();

        // get attributes (ONNX defaults dilations and strides to 1 along
        // each spatial axis, and pads to 0)
        SmallVector<int64_t> dilations, kernelShape, pads, strides;
        SmallVector<int64_t> defaultDilations(rank - 2, 1);
        SmallVector<int64_t> defaultPads(2 * (rank - 2), 0);
        SmallVector<int64_t> defaultStrides(rank - 2, 1);
        int64_t group, offsetGroup;
        if (binder.s64IntegerArrayAttr(dilations, "dilations",
                                       defaultDilations) ||
            binder.s64IntegerArrayAttr(kernelShape, "kernel_shape", {}) ||
            binder.s64IntegerArrayAttr(pads, "pads", defaultPads) ||
            binder.s64IntegerArrayAttr(strides, "strides", defaultStrides) ||
            binder.s64IntegerAttr(group, "group", 1) ||
            binder.s64IntegerAttr(offsetGroup, "offset_group", 1))
          return failure();
        for (unsigned i = 0; i < rank - 2; i++) {
          if (pads[i] != pads[rank + i - 2])
            return rewriter.notifyMatchFailure(
                binder.op, "unsupported: asymmetric padding");
        }

        // Identify and assign names to operands
        Value input, weight, offset, bias, mask;
        bool useMask = false;
        input = operands[0];
        weight = operands[1];
        offset = operands[2];
        if (operands.size() == 4) {
          auto unknownOpdRank = Torch::getTensorRank(operands[3]);
          if (!unknownOpdRank)
            return failure();
          if (*unknownOpdRank == 1)
            bias = operands[3];
          else if (*unknownOpdRank == rank) {
            mask = operands[3];
            useMask = true;
          } else
            llvm_unreachable("onnx.DeformConv: optional 4th operand of "
                             "unexpected rank encountered");
        }
        if (operands.size() == 5) {
          bias = operands[3];
          mask = operands[4];
          useMask = true;
        }

        // assign default operand values if necessary
        ArrayRef<int64_t> weightSizes = weightType.getSizes();
        ArrayRef<int64_t> offsetSizes = offsetType.getSizes();
        if (!bias) {
          int64_t outputChannels = weightSizes[0];
          SmallVector<int64_t> biasShape(1, outputChannels);
          Value biasShapeList = mlir::torch::onnx_c::createConstantIntList(
              binder, rewriter, biasShape);
          Value cstZero = Torch::getConstantWithGivenDtypeAndValue(
              rewriter, loc, 0.0f, inputType.getDtype());
          bias =
              Torch::createInitTensor(rewriter, loc,
                                      rewriter.getType<Torch::ValueTensorType>(
                                          biasShape, inputType.getDtype()),
                                      cstZero, biasShapeList);
        }
        if (!mask) {
          int64_t batchSize = inputType.getSizes()[0];
          int64_t kernelHeight = weightSizes[2];
          int64_t kernelWidth = weightSizes[3];
          int64_t outputHeight = offsetSizes[2];
          int64_t outputWidth = offsetSizes[3];
          int64_t maskDimOne = offsetGroup * kernelHeight * kernelWidth;
          SmallVector<int64_t> maskShape(
              {batchSize, maskDimOne, outputHeight, outputWidth});
          Value cstOne = Torch::getConstantWithGivenDtypeAndValue(
              rewriter, loc, 1.0f, inputType.getDtype());
          Value maskShapeList = mlir::torch::onnx_c::createConstantIntList(
              binder, rewriter, maskShape);
          mask =
              Torch::createInitTensor(rewriter, loc,
                                      rewriter.getType<Torch::ValueTensorType>(
                                          maskShape, inputType.getDtype()),
                                      cstOne, maskShapeList);
        }

        // get attributes as constant values
        SmallVector<Value> dilationValues, padValues, strideValues;
        for (auto i : dilations)
          dilationValues.push_back(rewriter.create<Torch::ConstantIntOp>(
              loc, rewriter.getI64IntegerAttr(i)));
        for (auto i : pads)
          padValues.push_back(rewriter.create<Torch::ConstantIntOp>(
              loc, rewriter.getI64IntegerAttr(i)));
        for (auto i : strides)
          strideValues.push_back(rewriter.create<Torch::ConstantIntOp>(
              loc, rewriter.getI64IntegerAttr(i)));
        Value groupValue = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(group));
        Value offsetGroupValue = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(offsetGroup));
        Value useMaskValue = rewriter.create<Torch::ConstantBoolOp>(
            loc, rewriter.getBoolAttr(useMask));
        rewriter.replaceOpWithNewOp<Torch::TorchvisionDeformConv2dOp>(
            binder.op, resultType, input, weight, offset, mask, bias,
            strideValues[0], strideValues[1], padValues[0], padValues[1],
            dilationValues[0], dilationValues[1], groupValue,
            offsetGroupValue, useMaskValue);
        return success();
      });
  patterns.onOp(
      "Det", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value input;
        if (binder.tensorOperand(input) ||
            binder.tensorResultType(resultType))
          return failure();
        rewriter.replaceOpWithNewOp<Torch::AtenLinalgDetOp>(
            binder.op, resultType, input);
        return success();
      });
  patterns.onOp(
      "DequantizeLinear", 1,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
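        // ONNX DequantizeLinear computes y = (x - zero_point) * scale. For
        // quantized integer inputs we materialize a quantized tensor and
        // dequantize it; for float inputs the affine computation is emitted
        // directly below.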
        llvm::SmallVector<Value> operands;
        if (binder.tensorOperands(operands, 3) ||
            binder.tensorResultType(resultType))
          return failure();

        auto loc = binder.getLoc();
        Value operand = operands[0];
        Value scale = operands[1];
        Value zeropoint = operands[2];

        auto operandTy = cast<Torch::ValueTensorType>(operand.getType());
        auto operandETy = operandTy.getDtype();
        auto scaleTy = dyn_cast<Torch::ValueTensorType>(scale.getType());
        if (!scaleTy || !scaleTy.hasSizes())
          return rewriter.notifyMatchFailure(binder.op, "requires known rank");
        if (!resultType.hasDtype())
          return rewriter.notifyMatchFailure(binder.op,
                                             "requires known result dtype");

        bool rank0 = scaleTy.getSizes().size() == 0;
        bool length1 =
            scaleTy.getSizes().size() == 1 && scaleTy.getSizes()[0] == 1;
        if (!rank0 && !length1)
          return rewriter.notifyMatchFailure(
              binder.op, "unimplemented: non-scalar scale");

        auto qTensorTy = getQTorchTypeFromTorchIntType(operandTy);
        if (!qTensorTy) {
          return rewriter.notifyMatchFailure(binder.op,
                                             "unsupported result dtype");
        }

        scale = rewriter.create<Torch::AtenItemOp>(
            loc, rewriter.getType<Torch::FloatType>(), scale);

        bool fpOperand = isa<mlir::FloatType>(operandETy);
        Type zeropointTy = rewriter.getType<Torch::IntType>();
        if (fpOperand)
          zeropointTy = rewriter.getType<Torch::FloatType>();
        zeropoint =
            rewriter.create<Torch::AtenItemOp>(loc, zeropointTy, zeropoint);

        if (fpOperand) {
          Value none = rewriter.create<Torch::ConstantNoneOp>(loc);
          Value cstFalse = rewriter.create<Torch::ConstantBoolOp>(loc, false);
          auto tyVal = Torch::getScalarTypeForType(resultType.getDtype());
          Value tyConst = rewriter.create<Torch::ConstantIntOp>(
              loc, rewriter.getType<Torch::IntType>(),
              rewriter.getIntegerAttr(rewriter.getIntegerType(64),
                                      static_cast<int64_t>(tyVal)));
          Value toDtype = rewriter.create<Torch::AtenToDtypeOp>(
              loc, resultType, operand, tyConst,
              /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
              /*memory_format=*/none);
          Value one = rewriter.create<Torch::ConstantFloatOp>(
              loc, rewriter.getF64FloatAttr(1.0));
          Value sub = rewriter.create<Torch::AtenSubScalarOp>(
              loc, resultType, toDtype, zeropoint, one);
          rewriter.replaceOpWithNewOp<Torch::AtenMulScalarOp>(
              binder.op, resultType, sub, scale);
          return success();
        }

        auto quantize =
            rewriter.create<Torch::Aten_MakePerTensorQuantizedTensorOp>(
                loc, qTensorTy, operand, scale, zeropoint);
        rewriter.replaceOpWithNewOp<Torch::AtenDequantizeSelfOp>(
            binder.op, resultType, quantize);
        return success();
      });
  patterns.onOp("Div", 7,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenDivTensorOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp(
      "Dropout", 12, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Location loc = binder.getLoc();
        Torch::ValueTensorType resultType;
        int64_t numOperands = binder.op->getNumOperands();
        SmallVector<Value> operands;
        int64_t seed;
        if (binder.tensorOperands(operands, numOperands) ||
            binder.s64IntegerAttr(seed, "seed", 0) ||
            binder.tensorResultTypeAtIndex(resultType, 0))
          return failure();

        // The global (default) seed value is 0.
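        // Torch's dropout op takes no explicit seed operand, so only the
        // ONNX default seed of 0 is accepted here; the RNG state is left to
        // the runtime.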
        if (seed != 0) {
          return rewriter.notifyMatchFailure(binder.op,
                                             "expected seed value to be 0");
        }

        Value ratio, trainingMode;
        if (numOperands == 3) {
          ratio =
              rewriter.create<Torch::AtenFloatImplicitOp>(loc, operands[1]);
          Value trainVal = operands[2];
          auto trainTensorType =
              dyn_cast<Torch::BaseTensorType>(trainVal.getType());
          if (!trainTensorType)
            return rewriter.notifyMatchFailure(
                binder.op, "train tensor must have a type");
          Type inputDtype = trainTensorType.getOptionalDtype();
          if (!inputDtype || !inputDtype.isInteger(1))
            return rewriter.notifyMatchFailure(
                binder.op,
                "train tensor must have an integer dtype of width 1");
          std::optional<unsigned> inputRank = Torch::getTensorRank(trainVal);
          if (!inputRank || *inputRank != 0)
            return rewriter.notifyMatchFailure(
                binder.op, "train tensor must have rank 0");

          if (auto valueTensorLiteralOp =
                  trainVal.getDefiningOp<Torch::ValueTensorLiteralOp>()) {
            auto val = cast<DenseElementsAttr>(valueTensorLiteralOp.getValue())
                           .getSplatValue<bool>();
            trainingMode = rewriter.create<Torch::ConstantBoolOp>(loc, val);
          } else {
            Value trainingModeScalar =
                rewriter.create<Torch::AtenIntImplicitOp>(loc, operands[2]);
            Value cstOne = rewriter.create<Torch::ConstantIntOp>(
                loc, rewriter.getI64IntegerAttr(1));
            trainingMode = rewriter.create<Torch::AtenEqIntOp>(
                loc, trainingModeScalar, cstOne);
          }
        } else if (numOperands == 2) {
          ratio =
              rewriter.create<Torch::AtenFloatImplicitOp>(loc, operands[1]);
          trainingMode = rewriter.create<Torch::ConstantBoolOp>(loc, false);
        } else {
          ratio = rewriter.create<Torch::ConstantFloatOp>(
              loc, rewriter.getF64FloatAttr(0.5));
          trainingMode = rewriter.create<Torch::ConstantBoolOp>(loc, false);
        }

        Value dropout = rewriter.create<Torch::AtenDropoutOp>(
            loc, resultType, /*input=*/operands[0], ratio, trainingMode);

        if (binder.op->getNumResults() == 1) {
          rewriter.replaceOp(binder.op, dropout);
          return success();
        }
        Torch::ValueTensorType maskType;
        if (binder.tensorResultTypeAtIndex(maskType, 1))
          return failure();
        Value dtype = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(
                     (int64_t)torch_upstream::ScalarType::Bool));
        Value none = rewriter.create<Torch::ConstantNoneOp>(loc);
        Value mask = rewriter.create<Torch::AtenOnesLikeOp>(
            loc, maskType, operands[0], dtype, /*layout=*/none,
            /*device=*/none, /*pin_memory=*/none, /*memory_format=*/none);
        rewriter.replaceOp(binder.op, {dropout, mask});
        return success();
      });
  patterns.onOp(
      "DynamicQuantizeLinear", 11,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Location loc = binder.getLoc();
        Value input;
        Torch::ValueTensorType resultType, scaleType, zeroPointType;
        if (binder.tensorOperand(input) ||
            binder.tensorResultTypeAtIndex(resultType, 0) ||
            binder.tensorResultTypeAtIndex(scaleType, 1) ||
            binder.tensorResultTypeAtIndex(zeroPointType, 2))
          return failure();

        Value scale, zeroPoint;

        // scale = ( max(0, max(input)) - min(0, min(input)) ) / 255
        Value inputMax =
            rewriter.create<Torch::AtenMaxOp>(loc, scaleType, input);
        Value inputMin =
            rewriter.create<Torch::AtenMinOp>(loc, scaleType, input);
        Value constantZero = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0));
        Value constantOne = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(1));
        Value zeroTensor =
            createRank0Tensor(rewriter, loc, scaleType, constantZero);
        Value inputMaxW0 = rewriter.create<Torch::AtenMaximumOp>(
            loc, scaleType, inputMax, zeroTensor);
        Value inputMinW0 = rewriter.create<Torch::AtenMinimumOp>(
            loc, scaleType, inputMin, zeroTensor);
        Value scaleTensor = rewriter.create<Torch::AtenSubTensorOp>(
            loc, scaleType, inputMaxW0, inputMinW0, constantOne);
        // Note: the following is hard-coded for ui8
        Value width = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(255));
        Value widthTensor = createRank0Tensor(rewriter, loc, scaleType, width);
        scaleTensor = rewriter.create<Torch::AtenDivTensorOp>(
            loc, scaleType, scaleTensor, widthTensor);

        // compute the preZeroPoint = 0 - (inputMin/scale)
        // compute the zeroPoint = cast ( round (clip or saturate
        // (preZeroPoint)))
        Value preZeroPoint = rewriter.create<Torch::AtenDivTensorOp>(
            loc, scaleType, inputMin, scaleTensor);
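        // Worked example: for input values spanning [-1.0, 2.0] the scale is
        // (2.0 - (-1.0)) / 255 ~= 0.01176, and the zero point is
        // round(clip(0 - (-1.0 / 0.01176), 0, 255)) = 85, so that the real
        // value 0.0 maps exactly onto the quantized value 85.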
        preZeroPoint = rewriter.create<Torch::AtenSubTensorOp>(
            loc, scaleType, zeroTensor, preZeroPoint, constantOne);
        // saturate to interval [0, 255]
        preZeroPoint = rewriter.create<Torch::AtenClampOp>(
            loc, scaleType, preZeroPoint, /*min=*/constantZero,
            /*max=*/width);
        // round, then cast to uint8
        preZeroPoint =
            rewriter.create<Torch::AtenRoundOp>(loc, scaleType, preZeroPoint);

        Type qTy = rewriter.getType<Torch::QUInt8Type>();
        auto qTensorTy = rewriter.getType<Torch::ValueTensorType>(
            resultType.getOptionalSizes(), qTy);
        auto torchqTy = Torch::getScalarTypeForType(qTy);

        Value tyConst = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(),
            rewriter.getIntegerAttr(rewriter.getIntegerType(64),
                                    static_cast<int64_t>(torchqTy)));
        Value none = rewriter.create<Torch::ConstantNoneOp>(loc);
        Value cstFalse = rewriter.create<Torch::ConstantBoolOp>(loc, false);
        Value zeroPointTensor = rewriter.create<Torch::AtenToDtypeOp>(
            loc, zeroPointType, preZeroPoint, tyConst,
            /*non_blocking=*/cstFalse, /*copy=*/cstFalse,
            /*memory_format=*/none);

        // extract scale and zeroPoint scalars to pass to
        // AtenQuantizePerTensorOp
        zeroPoint = rewriter.create<Torch::AtenItemOp>(
            loc, rewriter.getType<Torch::IntType>(), zeroPointTensor);
        scale = rewriter.create<Torch::AtenItemOp>(
            loc, rewriter.getType<Torch::FloatType>(), scaleTensor);
        Value quantizedTensor =
            rewriter.create<Torch::AtenQuantizePerTensorOp>(
                loc, qTensorTy, input, scale, zeroPoint, tyConst);

        // get uint8 tensor output
        Value output = rewriter.create<Torch::AtenIntReprOp>(loc, resultType,
                                                             quantizedTensor);
        rewriter.replaceOp(binder.op, {output, scaleTensor, zeroPointTensor});
        return success();
      });
  patterns.onOp("Equal", 1,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value lhs, rhs;
                  if (binder.tensorOperands(lhs, rhs) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenEqTensorOp>(
                      binder.op, resultType, lhs, rhs);
                  return success();
                });
  patterns.onOp("Elu", 6,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Location loc = binder.getLoc();
                  Torch::ValueTensorType resultType;
                  Value input;
                  float alpha;
                  if (binder.tensorOperand(input) ||
                      binder.f32FloatAttr(alpha, "alpha", 1.0) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  Value cstAlpha = rewriter.create<Torch::ConstantFloatOp>(
                      loc, rewriter.getF64FloatAttr(alpha));
                  Value cstOne = rewriter.create<Torch::ConstantFloatOp>(
                      loc, rewriter.getF64FloatAttr(1.0));
                  rewriter.replaceOpWithNewOp<Torch::AtenEluOp>(
                      binder.op, resultType, input, cstAlpha,
                      /*scale=*/cstOne, /*input_scale=*/cstOne);
                  return success();
                });
  patterns.onOp("Erf", 13,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenErfOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp("Exp", 6,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenExpOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp(
      "Expand", 1, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        // uses ideas and code from onnx.Reshape
        auto loc = binder.getLoc();
        Torch::ValueTensorType resultType;
        Value data, shape;
        if (binder.tensorOperands(data, shape) ||
            binder.tensorResultType(resultType))
          return failure();

        auto dataType = cast<Torch::ValueTensorType>(data.getType());
        auto shapeType = cast<Torch::ValueTensorType>(shape.getType());
        if (!dataType.hasSizes() || !shapeType.hasSizes())
          return failure();

        auto shapeSizes = shapeType.getSizes();
        int64_t dataRank = dataType.getSizes().size();
        int64_t shapeRank = shapeSizes.size();
        if (shapeRank != 1 || shapeSizes[0] == Torch::kUnknownSize)
          return failure();

        auto rankDifference = dataRank - shapeSizes[0];
        SmallVector<int64_t> selectSizes;
        Type selectResultType = shapeType.getWithSizesAndDtype(
            llvm::ArrayRef(selectSizes), shapeType.getOptionalDtype());
        // The 1-D onnx shape tensor has shapeSizes[0] elements.
        // A constant zero value
        Value zero = rewriter.create<Torch::ConstantIntOp>(
            loc, rewriter.getI64IntegerAttr(0));
        // Variable to store the pytorch int list of the shape (dimensions)
        SmallVector<Value> dimList;

        // Convert the shape tensor from a vector of int64_t to a torch int
        // list, since we lower to Torch::AtenBroadcastToOp, which takes a
        // list of ints.
        for (int i = 0; i < shapeSizes[0]; i++) {
          Value selectIndex = rewriter.create<Torch::ConstantIntOp>(
              loc, rewriter.getType<Torch::IntType>(),
              rewriter.getIntegerAttr(rewriter.getIntegerType(64), i));
          Value extract = rewriter.create<Torch::AtenSelectIntOp>(
              loc, selectResultType, shape, zero, selectIndex);
          Value dim = rewriter.create<Torch::AtenItemOp>(
              loc, rewriter.getType<Torch::IntType>(), extract);

          if (i + rankDifference >= 0) {
            Value iv = rewriter.create<Torch::ConstantIntOp>(
                loc, i + rankDifference);
            auto sz = rewriter.create<Torch::AtenSizeIntOp>(
                loc, rewriter.getType<Torch::IntType>(), data, iv);
            dim = rewriter.create<Torch::PrimMaxIntOp>(loc, dim, sz);
          }

          dimList.push_back(dim);
        }
        Value dimValueList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(
                Torch::IntType::get(binder.op->getContext())),
            dimList);
        rewriter.replaceOpWithNewOp<Torch::AtenBroadcastToOp>(
            binder.op, resultType, data, dimValueList);
        return success();
      });
  patterns.onOp(
      "EyeLike", 9, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value operand;
        int64_t dtypeIntOnnx, diagonalIndex;
        if (binder.tensorOperand(operand) ||
            binder.s64IntegerAttr(dtypeIntOnnx, "dtype", 1) ||
            binder.s64IntegerAttr(diagonalIndex, "k", 0) ||
            binder.tensorResultType(resultType))
          return failure();

        auto operandTy = cast<Torch::ValueTensorType>(operand.getType());
        SmallVector<int64_t> shape(operandTy.getSizes());
        for (unsigned i = 0; i < shape.size(); i++) {
          if (shape[i] == ShapedType::kDynamic)
            shape[i] = Torch::kUnknownSize;
        }

        Value cst0 = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));
        Value cst1 = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(1));
        Value nVal = rewriter.create<Torch::AtenSizeIntOp>(binder.getLoc(),
                                                           operand, cst0);
        Value mVal = rewriter.create<Torch::AtenSizeIntOp>(binder.getLoc(),
                                                           operand, cst1);
        Value noneVal =
            rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        std::optional<int64_t> dtypeIntTorch =
            onnxDtypeIntToTorchDtypeInt(dtypeIntOnnx);
        if (!dtypeIntTorch.has_value()) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "unimplemented support for the given dtype conversion");
        }
        Value dtypeVal = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(),
            rewriter.getI64IntegerAttr(dtypeIntTorch.value()));

        // diagonalIndex = 0 populates the main diagonal
        // diagonalIndex > 0 populates an upper diagonal
        // diagonalIndex < 0 populates a lower diagonal
        if (diagonalIndex == 0) {
          rewriter.replaceOpWithNewOp<Torch::AtenEyeMOp>(
              binder.op, resultType, nVal, mVal, dtypeVal, noneVal, noneVal,
              noneVal);
          return success();
        }

        Value diagVal = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(),
            rewriter.getI64IntegerAttr(std::abs(diagonalIndex)));
        Value newN, newM, dimVal, startVal;

        // get shapes of main diag eye op and zeros op
        if (diagonalIndex > 0) {
          newN = nVal;
          newM = rewriter.create<Torch::AtenSubIntOp>(binder.getLoc(), mVal,
                                                      diagVal);
          if (shape[1] != Torch::kUnknownSize) {
            shape[1] -= diagonalIndex;
          }
          dimVal = cst1;
          startVal = mVal;
        } else {
          newN = rewriter.create<Torch::AtenSubIntOp>(binder.getLoc(), nVal,
                                                      diagVal);
          newM = mVal;
          if (shape[0] != Torch::kUnknownSize) {
            shape[0] += diagonalIndex;
          }
          dimVal = cst0;
          startVal = nVal;
        }

        // create main diag eye op
        auto eyeResultType = rewriter.getType<Torch::ValueTensorType>(
            shape, resultType.getOptionalDtype());
        Value eyeOp = rewriter.create<Torch::AtenEyeMOp>(
            binder.getLoc(), eyeResultType, newN, newM, dtypeVal, noneVal,
            noneVal, noneVal);

        // create zeros op
        SmallVector<Value> zerosShapeValues = {nVal, mVal};
        Value zerosShapeList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            rewriter.getType<Torch::ListType>(
                rewriter.getType<Torch::IntType>()),
            zerosShapeValues);
        Value zerosOp = rewriter.create<Torch::AtenZerosOp>(
            binder.getLoc(), resultType, zerosShapeList, dtypeVal, noneVal,
            noneVal, noneVal);

        // embeds the values of the eye matrix into zeros
        rewriter.replaceOpWithNewOp<Torch::AtenSliceScatterOp>(
            binder.op, resultType, zerosOp, eyeOp, dimVal,
            /*start=*/diagVal, /*end=*/startVal, /*step=*/cst1);
        return success();
      });
  patterns.onOp(
      "Flatten", 11, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        // Flatten means to partition the input tensor's dimensions
        // into a "left range" spanning 0 to axis - 1 and a "right range"
        // spanning axis to rank - 1. Each range is then collapsed
        // into a single dimension, resulting in a 2-D tensor.
        // If either range is empty, it is replaced with a single
        // dimension of size 1.
        //
        // For example, for a 4-D input tensor of shape (a, b, c, d)
        // and axis==2, flatten produces a 2-D tensor of shape
        // (a*b, c*d).
        //
        // If instead axis==0, the left range is empty, and the result
        // is (1, a*b*c*d).
        Torch::ValueTensorType resultType;
        Value operand;
        int64_t axis;
        if (binder.tensorOperand(operand) ||
            binder.s64IntegerAttr(axis, "axis", 1) ||
            binder.tensorResultType(resultType))
          return failure();

        auto operandTy = cast<Torch::ValueTensorType>(operand.getType());
        llvm::SmallVector<int64_t> shape(operandTy.getSizes());
        int64_t rank = shape.size();

        // If axis is negative, count from the right instead of left
        if (axis < 0)
          axis = rank + axis;

        // We collapse in the dimensions to the right of the axis.
        for (int i = axis + 1; i < rank; ++i) {
          bool dynamic = shape[axis] == Torch::kUnknownSize ||
                         shape[i] == Torch::kUnknownSize;
          if (dynamic) {
            shape[axis] = Torch::kUnknownSize;
          } else {
            shape[axis] = shape[axis] * shape[i];
          }
        }
        shape.resize(axis + 1, 1);

        auto baseType = rewriter.getType<Torch::ValueTensorType>(
            shape, operandTy.getDtype());
        Value collapsedRight;
        if (axis >= rank) {
          // If the right range is empty, add a dim of size 1 to the
          // right side of the shape:
          // cr = torch.unsqueeze(x, x.ndim)
          Value rankConst = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(rank));
          collapsedRight = rewriter.create<Torch::AtenUnsqueezeOp>(
              binder.getLoc(), baseType, operand, rankConst);
        } else {
          // Otherwise, collapse the right range into a single dimension:
          // cr = torch._prims.collapse(x, axis, x.ndim - 1)
          Value axisConst = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(axis));
          Value rankLess1Const = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(rank - 1));
          collapsedRight = rewriter.create<Torch::PrimsCollapseOp>(
              binder.getLoc(), baseType, operand, axisConst, rankLess1Const);
        }

        Value zero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(0));

        if (axis <= 0) {
          // If the left range is empty, add a dim of size 1 to the
          // left side of the shape:
          // torch.unsqueeze(cr, 0)
          rewriter.replaceOpWithNewOp<Torch::AtenUnsqueezeOp>(
              binder.op, resultType, collapsedRight, zero);
          return success();
        }

        // Otherwise, collapse the left range into a single dimension:
        // torch._prims.collapse(cr, 0, axis - 1)
        Value axisLess1Const = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getI64IntegerAttr(axis - 1));
        rewriter.replaceOpWithNewOp<Torch::PrimsCollapseOp>(
            binder.op, resultType, collapsedRight, zero, axisLess1Const);
        return success();
      });
  patterns.onOp("Floor", 13,
                [](OpBinder binder, ConversionPatternRewriter &rewriter) {
                  Torch::ValueTensorType resultType;
                  Value operand;
                  if (binder.tensorOperand(operand) ||
                      binder.tensorResultType(resultType))
                    return failure();
                  rewriter.replaceOpWithNewOp<Torch::AtenFloorOp>(
                      binder.op, resultType, operand);
                  return success();
                });
  patterns.onOp(
      "ConstantOfShape", 1,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        Value shape;
        if (binder.tensorOperand(shape) ||
            binder.tensorResultType(resultType))
          return failure();

        // convert shape tensor to list of ints
        auto shapeSizes =
            dyn_cast<Torch::ValueTensorType>(shape.getType()).getSizes();
        SmallVector<Value> dimList;
        Torch::BaseTensorType shapeType =
            cast<Torch::BaseTensorType>(shape.getType());
        Type selectResultType = rewriter.getType<Torch::ValueTensorType>(
            ArrayRef<int64_t>({}), shapeType.getOptionalDtype());
        Value zero = rewriter.create<Torch::ConstantIntOp>(
            binder.getLoc(), rewriter.getType<Torch::IntType>(),
            rewriter.getIntegerAttr(rewriter.getIntegerType(64), 0));

        for (int i = 0; i < shapeSizes[0]; i++) {
          Value selectIndex = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(),
              rewriter.getIntegerAttr(rewriter.getIntegerType(64), i));
          Value extract = rewriter.create<Torch::AtenSelectIntOp>(
              binder.getLoc(), selectResultType, shape, zero, selectIndex);
          Value dim = rewriter.create<Torch::AtenItemOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(), extract);
          dimList.push_back(dim);
        }
        Value dimValueList = rewriter.create<Torch::PrimListConstructOp>(
            binder.getLoc(),
            Torch::ListType::get(
                Torch::IntType::get(binder.op->getContext())),
            dimList);
        Value noneVal =
            rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());

        // Get fill_value if it is present.
        // Assumption: resultDType and value attr type match.
        auto attr = binder.op->getAttr("torch.onnx.value");
        auto resultDType = resultType.getDtype();

        // Extract the fill value and dtype.
        // ONNX requires the value attr to be a tensor.
        if (!attr) {
          attr = DenseElementsAttr::get(
              resultType.toBuiltinTensor(),
              rewriter.getFloatAttr(resultDType, 0.0));
        }

        // If it's a dense resource attr, we need to convert to a dense type:
        if (DenseResourceElementsAttr rattr =
                dyn_cast_or_null<DenseResourceElementsAttr>(attr)) {
          // Bytes are stored in little endian order. Big endian support will
          // require swizzling.
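          // A DenseResourceElementsAttr only carries a handle to an
          // out-of-line blob, so after the endianness check below we
          // materialize it as a DenseElementsAttr over the raw bytes in
          // order to read the splat fill value.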
          if (!Endian::little) {
            binder.op->emitError(
                "unimplemented: importing on big endian systems");
            return failure();
          }

          auto ty = cast<ShapedType>(rattr.getType());
          auto ptr = rattr.getRawHandle().getBlob()->getData();
          auto denseAttr = DenseElementsAttr::getFromRawBuffer(ty, ptr);
          attr = dyn_cast_or_null<SplatElementsAttr>(denseAttr);
        }

        Attribute splattr;
        if (isa<SplatElementsAttr>(attr)) {
          auto denseAttr = cast<SplatElementsAttr>(attr);
          splattr = denseAttr.getSplatValue<Attribute>();
        }

        if (!isa<FloatAttr, IntegerAttr>(splattr)) {
          return rewriter.notifyMatchFailure(
              binder.op,
              "`value` attr tensor only supports types int and float for "
              "now.");
        }

        Value splatvalue;
        if (auto intattr = dyn_cast<IntegerAttr>(splattr)) {
          IntegerType intty = cast<IntegerType>(intattr.getType());
          int64_t value;
          if (intty.isUnsignedInteger()) {
            value = intattr.getUInt();
          } else if (intty.isSignedInteger()) {
            value = intattr.getSInt();
          } else {
            value = intattr.getInt();
          }
          splatvalue =
              rewriter.create<Torch::ConstantIntOp>(binder.getLoc(), value);
        }

        if (auto fpattr = dyn_cast<FloatAttr>(splattr))
          splatvalue = rewriter.create<Torch::ConstantFloatOp>(
              binder.getLoc(),
              rewriter.getF64FloatAttr(fpattr.getValueAsDouble()));

        rewriter.replaceOpWithNewOp<Torch::AtenFullOp>(
            binder.op, resultType, dimValueList, splatvalue,
            /*dtype=*/noneVal, /*layout=*/noneVal, /*device=*/noneVal,
            /*pin_memory=*/noneVal);
        return success();
      });
  patterns.onOp(
      "Einsum", 12, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Torch::ValueTensorType resultType;
        SmallVector<Value> tensors;
        std::string equation;
        if (binder.tensorOperands(tensors, binder.op->getNumOperands()) ||
            binder.customOpNameStringAttr(equation, "equation") ||
            binder.tensorResultType(resultType))
          return failure();
        Type listElemType =
            cast<Torch::BaseTensorType>(tensors[0].getType())
                .getWithSizesAndDtype(/*optionalSizes=*/std::nullopt,
                                      /*optionalDtype=*/nullptr);
        Type listType = Torch::ListType::get(listElemType);
        Value tensorList = rewriter.create<Torch::PrimListConstructOp>(
            binder.op->getLoc(), listType, tensors);
        Value cstEquation = rewriter.create<Torch::ConstantStrOp>(
            binder.getLoc(), rewriter.getType<Torch::StringType>(),
            rewriter.getStringAttr(equation));
        Value cstNone =
            rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        rewriter.replaceOpWithNewOp<Torch::AtenEinsumOp>(
            binder.op, resultType, cstEquation, tensorList,
            /*path=*/cstNone);
        return success();
      });
  patterns.onOp(
      "BlackmanWindow", 17,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Value size;
        Torch::ValueTensorType resultType;
        int64_t periodic, output_datatype;
        if (binder.tensorOperand(size) ||
            binder.s64IntegerAttr(output_datatype, "output_datatype", 1) ||
            binder.s64IntegerAttr(periodic, "periodic", 1) ||
            binder.tensorResultType(resultType)) {
          return failure();
        }
        Location loc = binder.getLoc();
        // Standard Blackman coefficients.
        Value a0 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.42));
        Value a1 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(-0.5));
        Value a2 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.08));

        auto windowFunctionResult =
            windowFunctionImpl(binder, rewriter, size, a0, a1, a2, resultType,
                               output_datatype, periodic);
        if (failed(windowFunctionResult))
          return failure();
        return success();
      });
  patterns.onOp(
      "HannWindow", 17,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Value size;
        Torch::ValueTensorType resultType;
        int64_t periodic, output_datatype;
        if (binder.tensorOperand(size) ||
            binder.s64IntegerAttr(output_datatype, "output_datatype", 1) ||
            binder.s64IntegerAttr(periodic, "periodic", 1) ||
            binder.tensorResultType(resultType)) {
          return failure();
        }
        Location loc = binder.getLoc();
        Value a0 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.5));
        Value a1 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(-0.5));
        Value a2 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.0));
        auto windowFunctionResult =
            windowFunctionImpl(binder, rewriter, size, a0, a1, a2, resultType,
                               output_datatype, periodic);
        if (failed(windowFunctionResult))
          return failure();
        return success();
      });
  patterns.onOp(
      "HammingWindow", 17,
      [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Value size;
        Torch::ValueTensorType resultType;
        int64_t periodic, output_datatype;
        if (binder.tensorOperand(size) ||
            binder.s64IntegerAttr(output_datatype, "output_datatype", 1) ||
            binder.s64IntegerAttr(periodic, "periodic", 1) ||
            binder.tensorResultType(resultType)) {
          return failure();
        }
        Location loc = binder.getLoc();
        // ONNX HammingWindow uses a0 = 25/46 ~= 0.543478 and
        // a1 = -(21/46) ~= -0.456522.
        Value a0 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.543478));
        Value a1 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(-0.456522));
        Value a2 = rewriter.create<Torch::ConstantFloatOp>(
            loc, rewriter.getF64FloatAttr(0.0));

        auto windowFunctionResult =
            windowFunctionImpl(binder, rewriter, size, a0, a1, a2, resultType,
                               output_datatype, periodic);
        if (failed(windowFunctionResult))
          return failure();
        return success();
      });
  patterns.onOp(
      "DFT", 20, [](OpBinder binder, ConversionPatternRewriter &rewriter) {
        Value inTensor, dftLength, axis;
        Torch::ValueTensorType resultType;
        int64_t inverse, onesided;
        if (binder.tensorOperandAtIndex(inTensor, 0) ||
            binder.s64IntegerAttr(inverse, "inverse", 0) ||
            binder.s64IntegerAttr(onesided, "onesided", 0) ||
            binder.tensorResultType(resultType))
          return rewriter.notifyMatchFailure(
              binder.op, "Input Tensor / attrs / resultType bind failed");
        if (!binder.tensorOperandAtIndex(dftLength, 1)) {
          // Convert to int and pass as n
          dftLength = rewriter.create<Torch::AtenItemOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(), dftLength);
        } else {
          // Default for torch is None
          dftLength =
              rewriter.create<Torch::ConstantNoneOp>(binder.getLoc());
        }
        // Default is same for onnx and torch
        if (!binder.tensorOperandAtIndex(axis, 2)) {
          // convert to int and pass to dims
          axis = rewriter.create<Torch::AtenItemOp>(
              binder.getLoc(), rewriter.getType<Torch::IntType>(), axis);
        } else {
          // The default axis in torch is -1, while in onnx it is -2, since
          // the last onnx dimension holds the real/imaginary parts.
          axis = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(-2));
        }

        if (onesided == 1)
          return rewriter.notifyMatchFailure(binder.op,
                                             "Unsupported option : onesided");
        // norm default string attr
        Value norm = rewriter.create<Torch::ConstantStrOp>(
            binder.getLoc(), rewriter.getStringAttr(Twine("backward")));

        // Convert from the [..., 2] complex number repr for fft consumption.
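        // For instance, a real input of shape [B, N, 1] is first zero-padded
        // to [B, N, 2] (imaginary part 0), then viewed as a complex tensor
        // of shape [B, N] before being handed to the fft op.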
        Torch::ValueTensorType inType =
            binder.toValidTensorType(inTensor.getType());
        int64_t lastIndex = inType.getSizes().back();
        if (lastIndex != 1 && lastIndex != 2)
          return rewriter.notifyMatchFailure(
              binder.op,
              "Expected input tensor to have dims [..., 1] or [..., 2]");

        // concat with zeros to make it [..., 2]
        Value inForComplexVal = inTensor;
        ArrayRef<int64_t> inForComplexSizes = inType.getSizes().drop_back();
        if (lastIndex == 1) {
          Value constZeroVal = rewriter.create<Torch::ConstantFloatOp>(
              binder.getLoc(), rewriter.getF64FloatAttr(0));
          Value constOne = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(1));
          Value constZero = rewriter.create<Torch::ConstantIntOp>(
              binder.getLoc(), rewriter.getI64IntegerAttr(0));
          Value padSizeList =
              rewriter
                  .create<Torch::PrimListConstructOp>(
                      binder.getLoc(),
                      Torch::ListType::get(
                          rewriter.getType<Torch::IntType>()),
                      SmallVector<Value>({constZero, constOne}))
                  .getResult();
          Value modeVal = rewriter.create<Torch::ConstantStrOp>(
              binder.getLoc(), rewriter.getStringAttr("constant"));
          SmallVector<int64_t> resSize(inForComplexSizes);
          resSize.push_back(2);
          inForComplexVal = rewriter.create<Torch::AtenPadOp>(
              binder.getLoc(),
              inType.getWithSizesAndDtype(resSize, inType.getOptionalDtype()),
              inTensor, padSizeList, modeVal, constZeroVal);
        }
        Type inComplexTensorType = Torch::ValueTensorType::get(
            binder.op->getContext(), inForComplexSizes,
            mlir::ComplexType::get(inType.getDtype()));
        Value inComplexTensor = rewriter.create<Torch::AtenViewAsComplexOp>(
            binder.getLoc(), inComplexTensorType, inForComplexVal);
        Value ftOp;
        if (inverse == 0) {
          ftOp = rewriter.create<Torch::AtenFftFftOp>(
              binder.getLoc(), inComplexTensorType, inComplexTensor,
              /*n=*/dftLength, /*dim=*/axis, /*norm=*/norm);
        } else {
          ftOp = rewriter.create<Torch::AtenFftIfftOp>(
              binder.getLoc(), inComplexTensorType, inComplexTensor,
              /*n=*/dftLength, /*dim=*/axis, /*norm=*/norm);
        }
        rewriter.replaceOpWithNewOp<Torch::AtenViewAsRealOp>(
            binder.op, resultType, ftOp);
        return success();
      });
}