mirror of https://github.com/llvm/torch-mlir
[onnx] Fix `onnx.RNN` for layout attribute (#3620)
The `layout` attribute was not considered for the `onnx.RNN` operation. Added support for the attribute by transposing the inputs/outputs of the RNN when the layout value is valid.
parent af67f9efb0
commit 2511cf46b4
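For context (shapes taken from the ONNX RNN operator spec, not from this patch): `layout` selects where the batch dimension sits in the op's inputs and outputs. The patch canonicalizes `layout = 1` operands to the default `layout = 0` form, runs the existing lowering, and converts the results back. A standalone, illustrative reference of the spec's shape conventions:

```cpp
// Reference for the ONNX `layout` attribute (shapes per the ONNX RNN spec;
// this program is illustrative and not part of the patch).
#include <cstdio>

int main() {
  const char *rows[][3] = {
      {"X", "[seq_length, batch_size, input_size]",
       "[batch_size, seq_length, input_size]"},
      {"initial_h", "[num_directions, batch_size, hidden_size]",
       "[batch_size, num_directions, hidden_size]"},
      {"Y", "[seq_length, num_directions, batch_size, hidden_size]",
       "[batch_size, seq_length, num_directions, hidden_size]"},
      {"Y_h", "[num_directions, batch_size, hidden_size]",
       "[batch_size, num_directions, hidden_size]"},
  };
  for (const auto &r : rows)
    std::printf("%-10s layout=0 %-52s layout=1 %s\n", r[0], r[1], r[2]);
  return 0;
}
```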
```diff
@@ -151,6 +151,22 @@ RnnLayerOutput rnn_layer(ImplicitLocOpBuilder &b, Value X, Value initial_h,
   output.Y_h = loop.getResult(1);
   return output;
 }
+
+static Value StaticTranspose(ImplicitLocOpBuilder b, Value value, int64_t dim0,
+                             int64_t dim1) {
+  auto valueTy = cast<ValueTensorType>(value.getType());
+
+  SmallVector<int64_t> valueShape(valueTy.getSizes());
+  std::swap(valueShape[dim0], valueShape[dim1]);
+  valueTy = b.getType<ValueTensorType>(valueShape, valueTy.getDtype());
+
+  auto intType = b.getType<IntType>();
+  Value dim0v = b.create<ConstantIntOp>(intType, b.getI64IntegerAttr(dim0));
+  Value dim1v = b.create<ConstantIntOp>(intType, b.getI64IntegerAttr(dim1));
+
+  return b.create<AtenTransposeIntOp>(valueTy, value, dim0v, dim1v);
+}
+
 LogicalResult OnnxRnnExpander(OpBinder binder,
                               ConversionPatternRewriter &rewriter) {
   Location loc = binder.getLoc();
```
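The new helper builds the transposed result type by swapping the two static sizes, then emits Torch-dialect integer constants and an `AtenTransposeIntOp`. The shape bookkeeping in isolation (a minimal sketch, with `std::vector` standing in for the `ValueTensorType` size list):

```cpp
#include <cassert>
#include <cstdint>
#include <utility>
#include <vector>

using Shape = std::vector<int64_t>;

// Same size bookkeeping as StaticTranspose: copy the sizes, swap dim0/dim1.
static Shape transposedSizes(const Shape &sizes, int64_t dim0, int64_t dim1) {
  Shape out(sizes);
  std::swap(out[dim0], out[dim1]);
  return out;
}

int main() {
  // A [batch=4, seq=16, input=8] tensor transposed on dims 0/1 becomes
  // [seq=16, batch=4, input=8] -- the type the helper constructs.
  assert((transposedSizes({4, 16, 8}, 0, 1) == Shape{16, 4, 8}));
  return 0;
}
```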
```diff
@@ -201,9 +217,19 @@ LogicalResult OnnxRnnExpander(OpBinder binder,
     return rewriter.notifyMatchFailure(
         binder.op, "Missing required attribute hidden_size");
 
+  // Other attributes
+  int64_t layout;
+  if (binder.s64IntegerAttr(layout, "layout", 0))
+    return rewriter.notifyMatchFailure(binder.op,
+                                       "Unsupported layout attribute type.");
+
+  if (layout < 0 || layout > 1)
+    return rewriter.notifyMatchFailure(binder.op,
+                                       "Unsupported layout attribute value.");
+
   // Result types
   ValueTensorType yTy, Y_hType;
-  if (binder.tensorResultTypeAtIndex(yTy, 0) ||
+  if (binder.tensorResultTypeAtIndex(yTy, 0) &&
       binder.tensorResultTypeAtIndex(Y_hType, 1)) {
     return rewriter.notifyMatchFailure(binder.op,
                                        "At least one output must be present");
```
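Besides adding the `layout` checks, this hunk flips `||` to `&&` in the result-type check: `tensorResultTypeAtIndex` fails when the output at that index is absent, so the old code rejected any `onnx.RNN` that omitted either output, while the fixed code rejects only when both are missing, matching the "At least one output" message. A boolean model of the predicate change (stand-ins, not the real binder API):

```cpp
#include <cassert>

// Boolean model of binder.tensorResultTypeAtIndex: it "fails" (true here)
// when the output at that index is absent. Illustrative only.
static bool rejectOld(bool missingY, bool missingYh) {
  return missingY || missingYh; // old: bail if either output is missing
}
static bool rejectNew(bool missingY, bool missingYh) {
  return missingY && missingYh; // fixed: bail only if both are missing
}

int main() {
  // Only Y_h requested: previously rejected, now accepted.
  assert(rejectOld(/*missingY=*/true, /*missingYh=*/false));
  assert(!rejectNew(/*missingY=*/true, /*missingYh=*/false));
  // Neither output requested: both versions reject, as the message says.
  assert(rejectOld(true, true) && rejectNew(true, true));
  return 0;
}
```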
```diff
@@ -229,6 +255,12 @@ LogicalResult OnnxRnnExpander(OpBinder binder,
     initial_h = nullptr;
   }
 
+  if (layout == 1) {
+    X = StaticTranspose(b, X, 0, 1);
+    if (initial_h)
+      initial_h = StaticTranspose(b, initial_h, 0, 1);
+  }
+
   // validation
   auto xTy = cast<ValueTensorType>(X.getType());
   auto wTy = cast<ValueTensorType>(W.getType());
```
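With `layout == 1`, the operands arrive batch-first, so they are transposed into the batch-second form the rest of the lowering assumes; `initial_h` is an optional operand, hence the guard. The same control flow on plain data (a sketch; `std::optional` models the nullable `Value`):

```cpp
#include <cassert>
#include <cstdint>
#include <optional>
#include <utility>
#include <vector>

using Shape = std::vector<int64_t>;
static Shape swap01(Shape s) { std::swap(s[0], s[1]); return s; }

int main() {
  // layout == 1 input arrives batch-first: [batch, seq, input].
  Shape X{4, 16, 8};
  std::optional<Shape> initialH; // absent, mirroring initial_h == nullptr
  X = swap01(X);                 // -> [seq, batch, input]
  if (initialH)                  // transposed only when actually present
    *initialH = swap01(*initialH);
  assert((X == Shape{16, 4, 8}) && !initialH);
  return 0;
}
```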
```diff
@@ -238,6 +270,7 @@ LogicalResult OnnxRnnExpander(OpBinder binder,
   auto rShape = rTy.getSizes();
   assert(wShape.size() == 3);
 
+  int64_t seq_len = xShape[0];
   int64_t batch_size = xShape[1];
   int64_t x_input_size = xShape[2];
 
```
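The added `seq_len` is read from `xShape[0]`, which is safe because any `layout == 1` input was already transposed above; it feeds the explicit `Y` result type in the final hunk. A worked shape check under assumed sizes (all values made up):

```cpp
#include <cassert>
#include <cstdint>
#include <vector>

int main() {
  // After layout normalization, xShape is [seq_len, batch, input]
  // regardless of the original layout.
  std::vector<int64_t> xShape{16, 4, 8};
  int64_t seq_len = xShape[0], batch_size = xShape[1];
  int64_t num_directions = 1, hidden_size = 32; // forward RNN; assumed size
  // The explicit Y type built later is
  // [seq_len, num_directions, batch_size, hidden_size]:
  std::vector<int64_t> yShape{seq_len, num_directions, batch_size, hidden_size};
  assert((yShape == std::vector<int64_t>{16, 1, 4, 32}));
  return 0;
}
```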
```diff
@@ -368,7 +401,24 @@ LogicalResult OnnxRnnExpander(OpBinder binder,
   Value Y_h_unsqueezed = b.create<AtenUnsqueezeOp>(Y_h_unsqueezed_type,
                                                    rnnLayerOutput.Y_h, cstZero);
 
-  Value Y_unsqueezed = b.create<AtenUnsqueezeOp>(yTy, rnnLayerOutput.Y, cstOne);
+  auto Y_unsqueezed_type = b.getType<ValueTensorType>(
+      llvm::SmallVector<int64_t>{seq_len, num_directions, batch_size,
+                                 hidden_size},
+      cast<ValueTensorType>(rnnLayerOutput.Y_h.getType()).getDtype());
+  Value Y_unsqueezed =
+      b.create<AtenUnsqueezeOp>(Y_unsqueezed_type, rnnLayerOutput.Y, cstOne);
+
+  if (layout == 1) {
+    Y_h_unsqueezed = StaticTranspose(b, Y_h_unsqueezed, 0, 1);
+    Y_unsqueezed = StaticTranspose(b, Y_unsqueezed, 1, 2);
+    Y_unsqueezed = StaticTranspose(b, Y_unsqueezed, 0, 1);
+  }
+
   if (!yTy)
     Y_unsqueezed = cstNone;
   if (!Y_hType)
     Y_h_unsqueezed = cstNone;
 
   rewriter.replaceOp(binder.op, {Y_unsqueezed, Y_h_unsqueezed});
   return success();
 }
```
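Building `Y_unsqueezed_type` explicitly rather than reusing `yTy` matters because, after the earlier `&&` fix, `yTy` may be null when only `Y_h` is requested; presumably that is why the type is rebuilt from the known dimensions. The two `StaticTranspose` calls then turn the layout-0 result `[seq, dirs, batch, hidden]` into the layout-1 `[batch, seq, dirs, hidden]`, while `Y_h` needs a single swap. A standalone check of those index shuffles (illustrative sizes):

```cpp
#include <cassert>
#include <cstdint>
#include <utility>
#include <vector>

using Shape = std::vector<int64_t>;
static Shape swapDims(Shape s, int a, int b) { std::swap(s[a], s[b]); return s; }

int main() {
  // layout == 0: Y is [seq_len, num_directions, batch_size, hidden_size].
  Shape Y{16, 1, 4, 32};
  Y = swapDims(Y, 1, 2); // -> [seq, batch, dirs, hidden]
  Y = swapDims(Y, 0, 1); // -> [batch, seq, dirs, hidden], the layout == 1 form
  assert((Y == Shape{4, 16, 1, 32}));

  // Y_h only needs its leading two dims swapped:
  // [dirs, batch, hidden] -> [batch, dirs, hidden].
  Shape Yh{1, 4, 32};
  Yh = swapDims(Yh, 0, 1);
  assert((Yh == Shape{4, 1, 32}));
  return 0;
}
```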