mirror of https://github.com/llvm/torch-mlir
[Torch] Disable 1-d quantized convolution (#3601)
To fix https://github.com/nod-ai/SHARK-Turbine/issues/253#issuecomment-2271815640 — prevent fusion for 1-d convolution ops and just do them as f32 convs, since there isn't a linalg named op for quantized 1-d convolution yet. Gets 24 ONNX eca* models passing in iree-compile.
pull/3607/head
parent
2d6bfb2dec
commit
a51b4e014a
|
@ -63,6 +63,15 @@ public:
|
||||||
llvm::SmallVector<Value> operands(op->getOperands());
|
llvm::SmallVector<Value> operands(op->getOperands());
|
||||||
bool dequanted = false;
|
bool dequanted = false;
|
||||||
|
|
||||||
|
// Prevent fusion for 1d convolution ops and just do it as an f32 conv since
|
||||||
|
// there isn't a linalg named op for quantized 1-d convolution yet.
|
||||||
|
// TODO: Remove this and add support for 1-d quantized convolution.
|
||||||
|
int64_t inputRank =
|
||||||
|
cast<ValueTensorType>(operands[0].getType()).getSizes().size();
|
||||||
|
if (isa<Torch::AtenConvolutionOp>(op) && inputRank < 4)
|
||||||
|
return rewriter.notifyMatchFailure(
|
||||||
|
op, "1-d quantized convolution is not supported");
|
||||||
|
|
||||||
for (unsigned i : QuantInfo<SrcOp>::operandsToQuantize) {
|
for (unsigned i : QuantInfo<SrcOp>::operandsToQuantize) {
|
||||||
Value operand = operands[i];
|
Value operand = operands[i];
|
||||||
std::stack<mlir::Operation *> commutingOpStack;
|
std::stack<mlir::Operation *> commutingOpStack;
|
||||||
|
|
Loading…
Reference in New Issue