torch-mlir/frontends/pytorch/e2e_testing/torchscript/elementwise.py

# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
# See https://llvm.org/LICENSE.txt for license information.
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

import torch

from torch_mlir_torchscript.e2e_test.framework import TestUtils
from torch_mlir_torchscript.e2e_test.registry import register_test_case
from torch_mlir_torchscript.annotations import annotate_args, export

# TODO: Support scalar !torch.int/!torch.float variants. Add support to
# ReduceOpVariants to implement them in terms of the tensor-only variants +
# torch.prim.NumToTensor.
# TODO: This is pretty verbose. Can we have a helper to reduce
# the boilerplate?
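
# A hypothetical helper along these lines could cut the per-test boilerplate.
# This is a sketch only: `make_unary_module` is not part of the test framework,
# and scripting a forward that closes over `op` is untested here.
def make_unary_module(op, annotation=([-1, -1], torch.float32, True)):
    """Build a single-input test module whose forward applies `op`."""
    class _UnaryModule(torch.nn.Module):
        @export
        @annotate_args([None, annotation])
        def forward(self, a):
            return op(a)
    return _UnaryModule
# Usage would then shrink to:
#   @register_test_case(module_factory=make_unary_module(torch.tanh))
#   def ElementwiseTanhModule_basic(module, tu: TestUtils):
#       module.forward(tu.rand(3, 4))
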
# ==============================================================================

class ElementwiseUnaryModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1, -1], torch.float32, True),
    ])
    def forward(self, a):
        return torch.tanh(a)


@register_test_case(module_factory=lambda: ElementwiseUnaryModule())
def ElementwiseUnaryModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(3, 4))

# ==============================================================================

class ElementwiseBinaryModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1, -1], torch.float32, True),
        ([-1], torch.float32, True),
    ])
    def forward(self, a, b):
        return a * b


@register_test_case(module_factory=lambda: ElementwiseBinaryModule())
def ElementwiseBinaryModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(3, 4), tu.rand(4))

# ==============================================================================
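
# torch.lerp(input, end, weight) computes input + weight * (end - input)
# elementwise, making it a natural representative ternary elementwise op.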
class ElementwiseTernaryModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1, -1, -1], torch.float32, True),
        ([-1, -1], torch.float32, True),
        ([-1], torch.float32, True),
    ])
    def forward(self, a, b, c):
        return torch.lerp(a, b, c)


@register_test_case(module_factory=lambda: ElementwiseTernaryModule())
def ElementwiseTernaryModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(3, 4, 5), tu.rand(4, 5), tu.rand(5))

# ==============================================================================

# Addition is an interesting special case of a binary op, because under the
# hood it carries a third scalar "alpha" parameter, which needs special
# handling (see the note after the test case below).
class ElementwiseAddModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1], torch.float32, True),
        ([], torch.float32, True),
    ])
    def forward(self, a, b):
        return a + b


@register_test_case(module_factory=lambda: ElementwiseAddModule())
def ElementwiseAddModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(4), tu.rand())
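
# For reference, `a + b` on tensors dispatches to aten::add.Tensor, whose full
# signature is add(Tensor self, Tensor other, Scalar alpha=1) and which
# computes self + alpha * other. In plain PyTorch (illustrative only, not a
# registered test):
#
#   a, b = torch.rand(4), torch.rand(4)
#   assert torch.allclose(torch.add(a, b, alpha=2), a + 2 * b)
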
# ==============================================================================

class ElementwiseUnsqueezeBroadcastModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1], torch.float32, True),
        ([], torch.float32, True),
    ])
    def forward(self, a, b):
        return a * b.unsqueeze(0)


@register_test_case(
    module_factory=lambda: ElementwiseUnsqueezeBroadcastModule())
def ElementwiseUnsqueezeBroadcastModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(4), tu.rand())
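
# For reference: b is 0-d here, so b.unsqueeze(0) has static shape [1], and the
# multiply exercises static size-1 broadcasting against a's dynamic shape. In
# plain PyTorch:
#
#   torch.rand(()).unsqueeze(0).shape  # torch.Size([1])
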
# ==============================================================================

class ElementwiseFlattenBroadcastModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1], torch.float32, True),
        ([], torch.float32, True),
    ])
    def forward(self, a, b):
        return a * b.flatten(-1, -1)


@register_test_case(module_factory=lambda: ElementwiseFlattenBroadcastModule())
def ElementwiseFlattenBroadcastModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(6), tu.rand())
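
# For reference: flattening a 0-d tensor yields a 1-d tensor of static shape
# [1], so this test exercises the same static size-1 broadcasting through the
# flatten lowering. In plain PyTorch:
#
#   torch.rand(()).flatten(-1, -1).shape  # torch.Size([1])
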
# ==============================================================================

class ElementwiseReluModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1, -1], torch.float32, True),
    ])
    def forward(self, x):
        return torch.relu(x)


@register_test_case(module_factory=lambda: ElementwiseReluModule())
def ElementwiseReluModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(4, 2) - 0.5)

# ==============================================================================

class ElementwiseSigmoidModule(torch.nn.Module):
    def __init__(self):
        super().__init__()

    @export
    @annotate_args([
        None,
        ([-1, -1], torch.float32, True),
    ])
    def forward(self, x):
        return torch.sigmoid(x)


@register_test_case(module_factory=lambda: ElementwiseSigmoidModule())
def ElementwiseSigmoidModule_basic(module, tu: TestUtils):
    module.forward(tu.rand(3, 5))