torch-mlir/test/Dialect/Torch/func-builtin-tensorize.mlir

// RUN: npcomp-opt %s -torch-func-builtin-tensorize -split-input-file -verify-diagnostics -allow-unregistered-dialect | FileCheck %s

// This test is largely copied from `func-bufferize` upstream, as it covers
// the same scope.

// CHECK-LABEL:   func @identity(
// CHECK-SAME:                   %[[ARG:.*]]: tensor<f32>) -> tensor<f32> {
// CHECK:           %[[TENSOR:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>
// CHECK:           %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>
// CHECK:           return %[[MEMREF]] : tensor<f32>
func @identity(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {
  return %arg0 : !torch.vtensor<[],f32>
}

// CHECK-LABEL:   func @block_arguments(
// CHECK-SAME:        %[[ARG:.*]]: tensor<f32>) -> tensor<f32> {
// CHECK:           %[[T1:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>
// CHECK:           %[[M1:.*]] = torch.to_builtin_tensor %[[T1]] : !torch.vtensor<[],f32> -> tensor<f32>
// CHECK:           br ^bb1(%[[M1]] : tensor<f32>)
// CHECK:         ^bb1(%[[BBARG:.*]]: tensor<f32>):
// CHECK:           %[[T2:.*]] = torch.from_builtin_tensor %[[BBARG]] : tensor<f32> -> !torch.vtensor<[],f32>
// CHECK:           %[[M2:.*]] = torch.to_builtin_tensor %[[T2]] : !torch.vtensor<[],f32> -> tensor<f32>
// CHECK:           return %[[M2]] : tensor<f32>
func @block_arguments(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {
  br ^bb1(%arg0: !torch.vtensor<[],f32>)
^bb1(%bbarg: !torch.vtensor<[],f32>):
  return %bbarg : !torch.vtensor<[],f32>
}

// CHECK-LABEL:   func private @source() -> tensor<f32>
// CHECK-LABEL:   func @call_source() -> tensor<f32> {
// CHECK:           %[[RET:.*]] = call @source() : () -> tensor<f32>
// CHECK:           return %[[RET]] : tensor<f32>
func private @source() -> !torch.vtensor<[],f32>
func @call_source() -> !torch.vtensor<[],f32> {
  %0 = call @source() : () -> !torch.vtensor<[],f32>
  return %0 : !torch.vtensor<[],f32>
}
// CHECK-LABEL:   func @call_sink(
// CHECK-SAME:                    %[[ARG:.*]]: tensor<f32>) {
// CHECK:           %[[TENSOR:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>
// CHECK:           %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>
// CHECK:           call @sink(%[[MEMREF]]) : (tensor<f32>) -> ()
// CHECK:           return
func private @sink(!torch.vtensor<[],f32>)
func @call_sink(%arg0: !torch.vtensor<[],f32>) {
  call @sink(%arg0) : (!torch.vtensor<[],f32>) -> ()
  return
}

// CHECK-LABEL:   func @unconverted_op_in_body() -> tensor<f32> {
// CHECK:           %[[TENSOR:.*]] = "test.source"() : () -> !torch.vtensor<[],f32>
// CHECK:           %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>
// CHECK:           return %[[MEMREF]] : tensor<f32>
func @unconverted_op_in_body() -> !torch.vtensor<[],f32> {
  %0 = "test.source"() : () -> !torch.vtensor<[],f32>
  return %0 : !torch.vtensor<[],f32>
}

// -----

// Because this pass updates block arguments, it needs to also atomically
// update all terminators and issue an error if that is not possible.
func @unable_to_update_terminator(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {
    %0 = constant true
    cond_br %0, ^bb1(%arg0: !torch.vtensor<[],f32>), ^bb2(%arg0: !torch.vtensor<[],f32>)
  ^bb1(%bbarg0: !torch.vtensor<[],f32>):
    // expected-error @+1 {{failed to legalize operation 'test.terminator'}}
    "test.terminator"() : () -> ()
  ^bb2(%bbarg1: !torch.vtensor<[],f32>):
    return %bbarg1 : !torch.vtensor<[],f32>
}

// -----

// There was a bug in func-bufferize pass which caused terminators without
// ReturnLike and BranchOpInterface traits (e.g. scf.condition) to always
// fail to legalize even if bufferization doesn't needed.
// Check the pass succedeed.
// CHECK: while
// CHECK: scf.while
// CHECK: scf.condition
func @bwhile(%arg0: i64, %arg1: i64) -> i64 {
  %c2_i64 = constant 2 : i64
  %0:2 = scf.while (%arg2 = %arg0) : (i64) -> (i64, i64) {
    %1 = cmpi slt, %arg2, %arg1 : i64
    scf.condition(%1) %arg2, %arg2 : i64, i64
  } do {
  ^bb0(%arg2: i64, %arg3: i64):
    %1 = muli %arg3, %c2_i64 : i64
    scf.yield %1 : i64
  }
  return %0#1 : i64
}
Introduce `!torch.tensor` / `!torch.vtensor` types. This removes our reliance on the numpy dialect and avoids our off-label use of the builtin tnesor type for modeling unknown dtypes. The `!torch.vtensor` (`ValueTensorType`) type is a value-semantic tensor. The `!torch.tensor` (`NonValueTensorType`) type is a non-value-semantic tensor. The new types look as follows syntactically: ``` // Least-static-information, non-value-semantic tensor. !torch.tensor // Explicit form of least-static-information variant. !torch.tensor<,unk> // Least-static-information, value-semantic tensor. !torch.vtensor // Explicit form of least-static-information variant. !torch.vtensor<,unk> // Fixed-set of allowable element types, with first-class support for // Torch's frontend signedness semantics. !torch.tensor<*,si32> // First-class support for unknown dtypes. !torch.tensor<[?,?,?],unk> // Standard MLIR representation of `?` for unknown dimensions. !torch.tensor<[?,2,?,4],unk> // Statically shaped / dtyped example. !torch.vtensor<[1,2,3,4],f32> ``` This required fairly significant changes throughout the compiler, but overall it is a big cleanup. We now have a much clearer layering of "the Torch frontend lowering" vs "lowering to std + linalg + etc.". At the C++ level, there is `ValueTensorType`, `NonValueTensorType`. We also have a helper `BaseTensorType` (kind of like ShapedType) which interoperates with those two. Included changes: - New `torch.tensor(dense<0.0> : tensor<5xf32>) : !torch.tensor` op for creating torch tensor literals in the frontend. - Consistently use signedness for the types (except i1 which I didn't touch -- we need to sort out the situation with !basicpy.BoolType there anyway so will be attending to that soon) - Frontend can annotate whether an argument to the function has value semantics. We currently require this, as our backend contract does not currently allow us to even model the non-value-semantic case. Before, the value-semantic assumption was randomly injected in the middle of the pass pipeline. - Move ArrayToTensor (now called MaximizeValueSemantics) and RefinePublicReturn passes to torch dialect. - The TorchToStd and TorchToLinalg passes are now type conversions from `!torch.vtensor` to `tensor` and use the dialect conversion infra. The overall conversion pipeline is set up following the best practices of the "Type Conversions the Not-So-Hard Way" talk. This required introducing `torch-func-builtin-tensorize` and `torch-finalizing-builtin-tensorize` passes analogous to the upstream bufferization passes with the corresponding names (mostly just copypasta from there). - Misc Torch-level canonicalizations -- we now cleanly layer the lowering to std later in the pipeline, so we are gradually lessening our reliance on random std constant folding before we get to that point. Recommended review order: - New types in TorchTypes.td/TorchTypes.h/TorchDialect.cpp - New ops in TorchOps.td / TorchOps.cpp - Less important / more mechanical stuff - Frontend changes. - Pass changes/additions in `Torch/Transforms` and `Conversion/` 2021-05-21 08:07:18 +08:00			`// RUN: npcomp-opt %s -torch-func-builtin-tensorize -split-input-file -verify-diagnostics -allow-unregistered-dialect \| FileCheck %s`

			// This test is largely copied from `func-bufferize` upstream, as it covers
			`// the same scope.`

			`// CHECK-LABEL: func @identity(`
			`// CHECK-SAME: %[[ARG:.*]]: tensor<f32>) -> tensor<f32> {`
			`// CHECK: %[[TENSOR:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>`
			`// CHECK: %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>`
			`// CHECK: return %[[MEMREF]] : tensor<f32>`
			`func @identity(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {`
			`return %arg0 : !torch.vtensor<[],f32>`
			`}`

			`// CHECK-LABEL: func @block_arguments(`
			`// CHECK-SAME: %[[ARG:.*]]: tensor<f32>) -> tensor<f32> {`
			`// CHECK: %[[T1:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>`
			`// CHECK: %[[M1:.*]] = torch.to_builtin_tensor %[[T1]] : !torch.vtensor<[],f32> -> tensor<f32>`
			`// CHECK: br ^bb1(%[[M1]] : tensor<f32>)`
			`// CHECK: ^bb1(%[[BBARG:.*]]: tensor<f32>):`
			`// CHECK: %[[T2:.*]] = torch.from_builtin_tensor %[[BBARG]] : tensor<f32> -> !torch.vtensor<[],f32>`
			`// CHECK: %[[M2:.*]] = torch.to_builtin_tensor %[[T2]] : !torch.vtensor<[],f32> -> tensor<f32>`
			`// CHECK: return %[[M2]] : tensor<f32>`
			`func @block_arguments(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {`
			`br ^bb1(%arg0: !torch.vtensor<[],f32>)`
			`^bb1(%bbarg: !torch.vtensor<[],f32>):`
			`return %bbarg : !torch.vtensor<[],f32>`
			`}`

			`// CHECK-LABEL: func private @source() -> tensor<f32>`
			`// CHECK-LABEL: func @call_source() -> tensor<f32> {`
			`// CHECK: %[[RET:.*]] = call @source() : () -> tensor<f32>`
			`// CHECK: return %[[RET]] : tensor<f32>`
			`func private @source() -> !torch.vtensor<[],f32>`
			`func @call_source() -> !torch.vtensor<[],f32> {`
			`%0 = call @source() : () -> !torch.vtensor<[],f32>`
			`return %0 : !torch.vtensor<[],f32>`
			`}`
			`// CHECK-LABEL: func @call_sink(`
			`// CHECK-SAME: %[[ARG:.*]]: tensor<f32>) {`
			`// CHECK: %[[TENSOR:.*]] = torch.from_builtin_tensor %[[ARG]] : tensor<f32> -> !torch.vtensor<[],f32>`
			`// CHECK: %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>`
			`// CHECK: call @sink(%[[MEMREF]]) : (tensor<f32>) -> ()`
			`// CHECK: return`
			`func private @sink(!torch.vtensor<[],f32>)`
			`func @call_sink(%arg0: !torch.vtensor<[],f32>) {`
			`call @sink(%arg0) : (!torch.vtensor<[],f32>) -> ()`
			`return`
			`}`

			`// CHECK-LABEL: func @unconverted_op_in_body() -> tensor<f32> {`
			`// CHECK: %[[TENSOR:.*]] = "test.source"() : () -> !torch.vtensor<[],f32>`
			`// CHECK: %[[MEMREF:.*]] = torch.to_builtin_tensor %[[TENSOR]] : !torch.vtensor<[],f32> -> tensor<f32>`
			`// CHECK: return %[[MEMREF]] : tensor<f32>`
			`func @unconverted_op_in_body() -> !torch.vtensor<[],f32> {`
			`%0 = "test.source"() : () -> !torch.vtensor<[],f32>`
			`return %0 : !torch.vtensor<[],f32>`
			`}`

			`// -----`

			`// Because this pass updates block arguments, it needs to also atomically`
			`// update all terminators and issue an error if that is not possible.`
			`func @unable_to_update_terminator(%arg0: !torch.vtensor<[],f32>) -> !torch.vtensor<[],f32> {`
			`%0 = constant true`
			`cond_br %0, ^bb1(%arg0: !torch.vtensor<[],f32>), ^bb2(%arg0: !torch.vtensor<[],f32>)`
			`^bb1(%bbarg0: !torch.vtensor<[],f32>):`
			`// expected-error @+1 {{failed to legalize operation 'test.terminator'}}`
			`"test.terminator"() : () -> ()`
			`^bb2(%bbarg1: !torch.vtensor<[],f32>):`
			`return %bbarg1 : !torch.vtensor<[],f32>`
			`}`

			`// -----`

			`// There was a bug in func-bufferize pass which caused terminators without`
			`// ReturnLike and BranchOpInterface traits (e.g. scf.condition) to always`
			`// fail to legalize even if bufferization doesn't needed.`
			`// Check the pass succedeed.`
			`// CHECK: while`
			`// CHECK: scf.while`
			`// CHECK: scf.condition`
			`func @bwhile(%arg0: i64, %arg1: i64) -> i64 {`
			`%c2_i64 = constant 2 : i64`
			`%0:2 = scf.while (%arg2 = %arg0) : (i64) -> (i64, i64) {`
			`%1 = cmpi slt, %arg2, %arg1 : i64`
			`scf.condition(%1) %arg2, %arg2 : i64, i64`
			`} do {`
			`^bb0(%arg2: i64, %arg3: i64):`
			`%1 = muli %arg3, %c2_i64 : i64`
			`scf.yield %1 : i64`
			`}`
			`return %0#1 : i64`
			`}`