mirror of https://github.com/llvm/torch-mlir
Remove eager_mode

This was an experimental attempt at rolling our own op-by-op executor with `__torch_dispatch__`, but it proved difficult to make robust. Op-by-op execution is now easy to implement robustly with the PyTorch 2.0 stack, so we don't need eager_mode. Downstream users were using eager_mode to implement lockstep numerical accuracy debuggers; we implemented the same functionality with TorchDynamo in https://github.com/llvm/torch-mlir/pull/1681, so there is not much reason to continue maintaining it.

parent 109c91ae9b
commit 7731211d02
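As a rough illustration of the claim above (not part of this commit, and only a hedged sketch): with the PyTorch 2.0 stack, op-by-op interception falls out of writing a custom TorchDynamo backend, which receives an FX graph whose nodes can be executed or checked one at a time, the role eager_mode previously needed `__torch_dispatch__` for. The backend and function names below are hypothetical; the actual lockstep debugging support lives in the TorchDynamo-based work referenced above.

```python
import torch

def op_by_op_backend(gm: torch.fx.GraphModule, example_inputs):
    # Each captured op is a node in the FX graph and can be inspected,
    # executed individually, or compared against a reference here.
    for node in gm.graph.nodes:
        if node.op == "call_function":
            print("captured op:", node.target)
    # Fall back to running the captured graph eagerly.
    return gm.forward

@torch.compile(backend=op_by_op_backend)
def f(x, y):
    return torch.relu(x @ y)

f(torch.randn(4, 4), torch.randn(4, 4))
```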
@@ -75,14 +75,6 @@ torch-mlir prediction

View examples [here](docs/ltc_examples.md).

### Eager Mode

Eager mode with TorchMLIR is a very experimental eager mode backend for PyTorch through the torch-mlir framework.
Effectively, this mode works by compiling operator by operator as the NN is eagerly executed by PyTorch.
This mode includes a fallback to conventional PyTorch if anything in the torch-mlir compilation process fails (e.g., unsupported operator).
A simple example can be found at [eager_mode.py](examples/eager_mode.py).
A ResNet18 example can be found at [eager_mode_resnet18.py](examples/eager_mode_resnet18.py).

## Repository Layout

The project follows the conventions of typical MLIR-based projects:
@@ -262,9 +262,6 @@ function test_in_tree() {
  echo ":::: Run Linalg e2e integration tests"
  python -m e2e_testing.main --config=linalg -v

  echo ":::: Run eager_mode e2e integration tests"
  python -m e2e_testing.main --config=eager_mode -v

  echo ":::: Run MHLO e2e integration tests"
  python -m e2e_testing.main --config=mhlo -v
@@ -20,7 +20,6 @@ from torch_mlir_e2e_test.configs import (
    NativeTorchTestConfig,
    TorchScriptTestConfig,
    TosaBackendTestConfig,
    EagerModeTestConfig,
    TorchDynamoTestConfig,
)

@@ -28,14 +27,14 @@ from torch_mlir_e2e_test.linalg_on_tensors_backends.refbackend import RefBackend
from torch_mlir_e2e_test.mhlo_backends.linalg_on_tensors import LinalgOnTensorsMhloBackend
from torch_mlir_e2e_test.tosa_backends.linalg_on_tensors import LinalgOnTensorsTosaBackend

from .xfail_sets import LINALG_XFAIL_SET, MHLO_PASS_SET, TOSA_PASS_SET, EAGER_MODE_XFAIL_SET, LTC_XFAIL_SET, TORCHDYNAMO_XFAIL_SET
from .xfail_sets import LINALG_XFAIL_SET, MHLO_PASS_SET, TOSA_PASS_SET, LTC_XFAIL_SET, TORCHDYNAMO_XFAIL_SET

# Import tests to register them in the global registry.
from torch_mlir_e2e_test.test_suite import register_all_tests
register_all_tests()

def _get_argparse():
    config_choices = ['native_torch', 'torchscript', 'linalg', 'mhlo', 'tosa', 'eager_mode', 'lazy_tensor_core', 'torchdynamo']
    config_choices = ['native_torch', 'torchscript', 'linalg', 'mhlo', 'tosa', 'lazy_tensor_core', 'torchdynamo']
    parser = argparse.ArgumentParser(description='Run torchscript e2e tests.')
    parser.add_argument('-c', '--config',
                        choices=config_choices,

@@ -47,7 +46,6 @@ Meaning of options:
"tosa": run through torch-mlir's default TOSA backend.
"native_torch": run the torch.nn.Module as-is without compiling (useful for verifying model is deterministic; ALL tests should pass in this configuration).
"torchscript": compile the model to a torch.jit.ScriptModule, and then run that as-is (useful for verifying TorchScript is modeling the program correctly).
"eager_mode": run through torch-mlir's eager mode frontend, using Linalg-on-Tensors for execution.
"lazy_tensor_core": run the model through the Lazy Tensor Core frontend and execute the traced graph.
"torchdynamo": run the model through the TorchDynamo frontend and execute the graph using Linalg-on-Tensors.
''')

@@ -91,9 +89,6 @@ def main():
    elif args.config == 'torchscript':
        config = TorchScriptTestConfig()
        xfail_set = {}
    elif args.config == 'eager_mode':
        config = EagerModeTestConfig()
        xfail_set = EAGER_MODE_XFAIL_SET
    elif args.config == 'lazy_tensor_core':
        config = LazyTensorCoreTestConfig()
        xfail_set = LTC_XFAIL_SET
@@ -14,13 +14,6 @@ from torch_mlir_e2e_test.test_suite import COMMON_TORCH_MLIR_LOWERING_XFAILS

LINALG_XFAIL_SET = COMMON_TORCH_MLIR_LOWERING_XFAILS

EAGER_MODE_XFAIL_SET = COMMON_TORCH_MLIR_LOWERING_XFAILS | {
    # RefBackend fails for some reason.
    # These tests pass in the regular RefBackend flow, so it's unclear
    # why they fail here.
    "Matmul_vecmat",
}

TORCHDYNAMO_XFAIL_SET = {
    #### General TorchDynamo/PyTorch errors
@@ -1,34 +0,0 @@
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
# See https://llvm.org/LICENSE.txt for license information.
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
# Also available under a BSD-style license. See LICENSE.

import torch

from torch_mlir.eager_mode.torch_mlir_tensor import TorchMLIRTensor

torch_a = torch.randn(5, requires_grad=True)
torch_b = torch.randn(5, requires_grad=True)

torch_c = torch_a + torch_b
torch_d = torch_a * torch_b
torch_e = torch_c / torch_d
torch_loss = torch_e.sum()
print("PyTorch loss: ", torch_loss)

torch_loss.backward()
print("PyTorch grad a: ", torch_a.grad)
print("PyTorch grad b: ", torch_b.grad)

a = TorchMLIRTensor(torch_a)
b = TorchMLIRTensor(torch_b)

c = a + b
d = a * b
e = c / d
loss = e.sum()
print("Torch-MLIR loss: ", loss)

loss.backward()
print("Torch-MLIR grad a: ", a.grad)
print("Torch-MLIR grad b: ", b.grad)
@ -1,89 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
import sys
|
||||
|
||||
import requests
|
||||
import torch
|
||||
import torchvision.models as models
|
||||
from PIL import Image
|
||||
from torchvision import transforms
|
||||
|
||||
from torch_mlir.eager_mode.torch_mlir_tensor import TorchMLIRTensor
|
||||
|
||||
|
||||
def load_and_preprocess_image(url: str):
|
||||
headers = {
|
||||
'User-Agent':
|
||||
'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36'
|
||||
}
|
||||
img = Image.open(requests.get(url, headers=headers,
|
||||
stream=True).raw).convert("RGB")
|
||||
# preprocessing pipeline
|
||||
preprocess = transforms.Compose([
|
||||
transforms.Resize(256),
|
||||
transforms.CenterCrop(224),
|
||||
transforms.ToTensor(),
|
||||
transforms.Normalize(mean=[0.485, 0.456, 0.406],
|
||||
std=[0.229, 0.224, 0.225]),
|
||||
])
|
||||
img_preprocessed = preprocess(img)
|
||||
return torch.unsqueeze(img_preprocessed, 0)
|
||||
|
||||
|
||||
def load_labels():
|
||||
classes_text = requests.get(
|
||||
"https://raw.githubusercontent.com/cathyzhyi/ml-data/main/imagenet-classes.txt",
|
||||
stream=True,
|
||||
).text
|
||||
labels = [line.strip() for line in classes_text.splitlines()]
|
||||
return labels
|
||||
|
||||
|
||||
def top3_possibilities(res):
|
||||
_, indexes = torch.sort(res, descending=True)
|
||||
percentage = torch.nn.functional.softmax(res, dim=1)[0] * 100
|
||||
top3 = [(labels[idx], percentage[idx].item()) for idx in indexes[0][:3]]
|
||||
return top3
|
||||
|
||||
|
||||
def predictions(torch_func, img, labels):
|
||||
golden_prediction = top3_possibilities(torch_func(img))
|
||||
print("PyTorch prediction")
|
||||
print(golden_prediction)
|
||||
prediction = top3_possibilities(torch_func(TorchMLIRTensor(img)))
|
||||
print("torch-mlir prediction")
|
||||
print(prediction)
|
||||
|
||||
|
||||
class ResNet18Module(torch.nn.Module):
|
||||
def __init__(self):
|
||||
super().__init__()
|
||||
self.resnet = models.resnet18(pretrained=True)
|
||||
self.train(False)
|
||||
|
||||
def forward(self, img):
|
||||
return self.resnet.forward(img)
|
||||
|
||||
|
||||
class TestModule(torch.nn.Module):
|
||||
def __init__(self):
|
||||
super().__init__()
|
||||
self.s = ResNet18Module()
|
||||
|
||||
def forward(self, x):
|
||||
return self.s.forward(x)
|
||||
|
||||
|
||||
image_url = (
|
||||
"https://upload.wikimedia.org/wikipedia/commons/2/26/YellowLabradorLooking_new.jpg"
|
||||
)
|
||||
|
||||
print("load image from " + image_url, file=sys.stderr)
|
||||
img = load_and_preprocess_image(image_url)
|
||||
labels = load_labels()
|
||||
|
||||
test_module = TestModule()
|
||||
predictions(test_module.forward, img, labels)
|
|
@@ -102,12 +102,6 @@ if(TORCH_MLIR_ENABLE_JIT_IR_IMPORTER)
  add_subdirectory(torch_mlir_e2e_test)
endif()

################################################################################
# Eager mode
################################################################################

add_subdirectory(torch_mlir/eager_mode)

################################################################################
# Custom op example
# Required for running the update_torch_ods.sh and update_shape_lib.sh scripts.
@ -1,320 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
# RUN: %PYTHON %s | FileCheck %s
|
||||
|
||||
|
||||
import torch
|
||||
|
||||
from framework import run_test
|
||||
from torch_mlir.eager_mode.ir_building import build_ts_script_function
|
||||
|
||||
|
||||
# CHECK: graph(%[[A1:.*]] : Tensor,
|
||||
# CHECK: %[[A2:.*]] : Tensor,
|
||||
# CHECK: %[[A3:.*]] : Tensor):
|
||||
# CHECK: %[[A4:.*]] : int = prim::Constant[value=1]()
|
||||
# CHECK: %[[A5:.*]] : int = prim::Constant[value=1]()
|
||||
# CHECK: %[[A0:.*]] : Tensor = aten::addmm(%[[A1]], %[[A2]], %[[A3]], %[[A4]], %[[A5]])
|
||||
# CHECK: return (%[[A0]])
|
||||
# -----
|
||||
# CHECK: PASS - simple
|
||||
@run_test
|
||||
def simple():
|
||||
target = torch.ops.aten.addmm.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
mat1=torch.randn(1, 3, 32, 32),
|
||||
mat2=torch.randn(1, 3, 32, 32),
|
||||
beta=1,
|
||||
alpha=1,
|
||||
)
|
||||
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[B1:.*]] : Tensor,
|
||||
# CHECK: %[[B2:.*]] : Tensor,
|
||||
# CHECK: %[[B3:.*]] : Tensor):
|
||||
# CHECK: %[[B4:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[B5:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[B6:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[B7:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[B8:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[B9:.*]] : int = prim::Constant[value=1]()
|
||||
# CHECK: %[[B0:.*]] : Tensor = aten::convolution(%[[B1]], %[[B2]], %[[B3]], %[[B4]], %[[B5]], %[[B6]], %[[B7]], %[[B8]], %[[B9]])
|
||||
# CHECK: return (%[[B0]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_optional_tensor_input
|
||||
@run_test
|
||||
def handle_optional_tensor_input():
|
||||
target = torch.ops.aten.convolution.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(3, 3, 3, 3),
|
||||
bias=torch.randn(3),
|
||||
stride=[1, 1],
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
transposed=False,
|
||||
output_padding=[0, 0],
|
||||
groups=1,
|
||||
)
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: FAIL - fail_not_enough_args
|
||||
# CHECK: Errors: 'groups'
|
||||
@run_test
|
||||
def fail_not_enough_args():
|
||||
target = torch.ops.aten.convolution.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(3, 3, 3, 3),
|
||||
bias=torch.randn(3),
|
||||
stride=[1, 1],
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
transposed=False,
|
||||
output_padding=[0, 0],
|
||||
# Missing groups=1,
|
||||
)
|
||||
build_ts_script_function(target._schema, kwargs)
|
||||
|
||||
|
||||
# CHECK: graph(%input : Tensor,
|
||||
# CHECK: %weight : Tensor,
|
||||
# CHECK: %bias : Tensor):
|
||||
# CHECK: %4 : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %5 : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %6 : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %7 : bool = prim::Constant[value=0]()
|
||||
# CHECK: %8 : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %9 : int = prim::Constant[value=1]()
|
||||
# CHECK: %0 : Tensor = aten::convolution(%input, %weight, %bias, %4, %5, %6, %7, %8, %9)
|
||||
# CHECK: return (%0)
|
||||
# -----
|
||||
# CHECK: PASS - simple_kwargs
|
||||
@run_test
|
||||
def simple_kwargs():
|
||||
target = torch.ops.aten.convolution.default
|
||||
script_fun1 = build_ts_script_function(
|
||||
target._schema,
|
||||
dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(3, 3, 3, 3),
|
||||
bias=torch.randn(3),
|
||||
stride=[1, 1],
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
transposed=False,
|
||||
output_padding=[0, 0],
|
||||
groups=1,
|
||||
),
|
||||
)
|
||||
|
||||
print(script_fun1.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[C2:.*]] : Tensor):
|
||||
# CHECK: %[[C3:.*]] : int[] = prim::Constant[value=[3, 3]]()
|
||||
# CHECK: %[[C4:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[C5:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[C6:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[C7:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[C0:.*]] : Tensor, %[[C1:.*]] : Tensor = aten::max_pool2d_with_indices(%[[C2]], %[[C3]], %[[C4]], %[[C5]], %[[C6]], %[[C7]])
|
||||
# CHECK: return (%[[C0]], %[[C1]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_empty_lists
|
||||
@run_test
|
||||
def handle_empty_lists():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
# print(target._schema)
|
||||
input = torch.randn((1, 3, 32, 32))
|
||||
kwargs = dict(
|
||||
input=input,
|
||||
kernel_size=[3, 3],
|
||||
stride=[],
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
ceil_mode=False,
|
||||
)
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[D2:.*]] : Tensor):
|
||||
# CHECK: %[[D3:.*]] : int[] = prim::Constant[value=[3, 3]]()
|
||||
# CHECK: %[[D4:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[D5:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[D6:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[D7:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[D0:.*]] : Tensor, %[[D1:.*]] : Tensor = aten::max_pool2d_with_indices(%[[D2]], %[[D3]], %[[D4]], %[[D5]], %[[D6]], %[[D7]])
|
||||
# CHECK: return (%[[D0]], %[[D1]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_nones
|
||||
@run_test
|
||||
def handle_nones():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
# print(target._schema)
|
||||
kwargs = dict(
|
||||
input=torch.randn((1, 3, 32, 32)),
|
||||
kernel_size=[3, 3],
|
||||
stride=None,
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
ceil_mode=False,
|
||||
)
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[E1:.*]] : Tensor,
|
||||
# CHECK: %[[E2:.*]] : Tensor,
|
||||
# CHECK: %[[E3:.*]] : Tensor):
|
||||
# CHECK: %[[E4:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[E5:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[E6:.*]] : int[] = prim::Constant[value=[1, 1]]()
|
||||
# CHECK: %[[E7:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[E8:.*]] : int[] = prim::Constant[value=[0, 0]]()
|
||||
# CHECK: %[[E9:.*]] : int = prim::Constant[value=1]()
|
||||
# CHECK: %[[E0:.*]] : Tensor = aten::convolution(%[[E1]], %[[E2]], %[[E3]], %[[E4]], %[[E5]], %[[E6]], %[[E7]], %[[E8]], %[[E9]])
|
||||
# CHECK: return (%[[E0]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_optional_tensors
|
||||
@run_test
|
||||
def handle_optional_tensors():
|
||||
target = torch.ops.aten.convolution.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(3, 3, 3, 3),
|
||||
bias=torch.randn(3),
|
||||
stride=[1, 1],
|
||||
padding=[0, 0],
|
||||
dilation=[1, 1],
|
||||
transposed=False,
|
||||
output_padding=[0, 0],
|
||||
groups=1,
|
||||
)
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[F1:.*]] : Tensor):
|
||||
# CHECK: %[[F2:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[F3:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[F4:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[F5:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[F6:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[F0:.*]] : Tensor = aten::ones_like(%[[F1]], %[[F2]], %[[F3]], %[[F4]], %[[F5]], %[[F6]])
|
||||
# CHECK: return (%[[F0]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_ones_like
|
||||
@run_test
|
||||
def handle_ones_like():
|
||||
target = torch.ops.aten.ones_like.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
dtype=None,
|
||||
layout=None,
|
||||
device=None,
|
||||
pin_memory=None,
|
||||
memory_format=None,
|
||||
)
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: graph(%[[G3:.*]] : Tensor,
|
||||
# CHECK: %[[G4:.*]] : Tensor,
|
||||
# CHECK: %[[G5:.*]] : Tensor):
|
||||
# CHECK: %[[G6:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[G7:.*]] : NoneType = prim::Constant()
|
||||
# CHECK: %[[G8:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[G9:.*]] : float = prim::Constant[value=1.]()
|
||||
# CHECK: %[[G10:.*]] : float = prim::Constant[value=1.]()
|
||||
# CHECK: %[[G0:.*]] : Tensor, %[[G1:.*]] : Tensor, %[[G2:.*]] : Tensor = aten::native_batch_norm(%[[G3]], %[[G4]], %[[G5]], %[[G6]], %[[G7]], %[[G8]], %[[G9]], %[[G10]])
|
||||
# CHECK: return (%[[G0]], %[[G1]], %[[G2]])
|
||||
# -----
|
||||
# CHECK: PASS - handle_multiple_outputs
|
||||
@run_test
|
||||
def handle_multiple_outputs():
|
||||
target = torch.ops.aten.native_batch_norm.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(1, 3, 32, 32),
|
||||
bias=torch.randn(1, 3, 32, 32),
|
||||
running_mean=None,
|
||||
running_var=None,
|
||||
training=False,
|
||||
momentum=1.0,
|
||||
eps=1.0
|
||||
)
|
||||
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
||||
|
||||
|
||||
# CHECK: f
|
||||
# CHECK: PASS - check_legal_name
|
||||
@run_test
|
||||
def check_legal_name():
|
||||
target = torch.ops.aten.native_batch_norm.default
|
||||
kwargs = dict(
|
||||
input=torch.randn(1, 3, 32, 32),
|
||||
weight=torch.randn(1, 3, 32, 32),
|
||||
bias=torch.randn(1, 3, 32, 32),
|
||||
running_mean=None,
|
||||
running_var=None,
|
||||
training=False,
|
||||
momentum=1.0,
|
||||
eps=1.0
|
||||
)
|
||||
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.name)
|
||||
|
||||
|
||||
# CHECK: graph(%[[H3:.*]] : Tensor,
|
||||
# CHECK: %[[H4:.*]] : Tensor,
|
||||
# CHECK: %[[H5:.*]] : Tensor,
|
||||
# CHECK: %[[H6:.*]] : Tensor,
|
||||
# CHECK: %[[H7:.*]] : Tensor,
|
||||
# CHECK: %out : Tensor,
|
||||
# CHECK: %save_mean : Tensor,
|
||||
# CHECK: %save_invstd : Tensor):
|
||||
# CHECK: %[[H8:.*]] : bool = prim::Constant[value=0]()
|
||||
# CHECK: %[[H9:.*]] : float = prim::Constant[value=0.10000000000000001]()
|
||||
# CHECK: %[[H10:.*]] : float = prim::Constant[value=0.0001]()
|
||||
# CHECK: %[[H0:.*]] : Tensor, %[[H1:.*]] : Tensor, %[[H2:.*]] : Tensor = aten::native_batch_norm(%[[H3]], %[[H4]], %[[H5]], %[[H6]], %[[H7]], %[[H8]], %[[H9]], %[[H10]], %out, %save_mean, %save_invstd)
|
||||
# CHECK: return (%[[H0]], %[[H1]], %[[H2]])
|
||||
# -----
|
||||
# CHECK: PASS - correctly_order_kwargs
|
||||
@run_test
|
||||
def correctly_order_kwargs():
|
||||
target = torch.ops.aten.native_batch_norm.out
|
||||
|
||||
input = torch.randn(2, 5, 2, 3)
|
||||
running_mean = torch.randn(5)
|
||||
running_var = torch.randn(5)
|
||||
|
||||
kwargs = dict(
|
||||
input=torch.randn(2, 5, 2, 3),
|
||||
weight=torch.randn(5),
|
||||
bias=torch.randn(5),
|
||||
running_mean=running_mean,
|
||||
running_var=running_var,
|
||||
training=False,
|
||||
momentum=0.1,
|
||||
eps=0.0001,
|
||||
out=torch.empty_like(input),
|
||||
save_mean=torch.empty_like(running_mean),
|
||||
save_invstd=torch.empty_like(running_var),
|
||||
)
|
||||
|
||||
script_fun = build_ts_script_function(target._schema, kwargs)
|
||||
print(script_fun.graph)
|
|
@@ -1,23 +0,0 @@
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
# See https://llvm.org/LICENSE.txt for license information.
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
# Also available under a BSD-style license. See LICENSE.

# RUN: true


def run_test(*args, XPASS=False, XFAIL=False):
    def _run_test(test):
        test_name = test.__name__
        try:
            test()
            print(("X" if XPASS else "") + f"PASS - {test_name}")
        except Exception as e:
            print(("X" if XFAIL else "") + f"FAIL - {test_name}")
            print("Errors: ", e)
        print()

    if len(args):
        _run_test(args[0])
    else:
        return _run_test
@ -1,69 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
# RUN: %PYTHON %s | FileCheck %s
|
||||
|
||||
|
||||
import torch
|
||||
|
||||
from framework import run_test
|
||||
from torch_mlir.eager_mode.torch_mlir_dispatch import normalize_args_kwargs
|
||||
|
||||
|
||||
# CHECK: PASS - should_normalize
|
||||
@run_test
|
||||
def should_normalize():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
input = torch.randn((1, 3, 32, 32))
|
||||
kwargs = {"kernel_size": [3, 3]}
|
||||
golden = {
|
||||
"kernel_size": [3, 3],
|
||||
# This is due to the schema for max_pool2d_with_indices defining
|
||||
# the stride arg as int[2] stride=[].
|
||||
"stride": [],
|
||||
"padding": [0, 0],
|
||||
"dilation": [1, 1],
|
||||
"ceil_mode": False,
|
||||
}
|
||||
|
||||
new_kwargs = normalize_args_kwargs(target, (input,), kwargs)
|
||||
assert torch.allclose(new_kwargs["input"], input)
|
||||
for k, v in new_kwargs.items():
|
||||
if k == "input": continue
|
||||
assert v == golden[k]
|
||||
|
||||
|
||||
# CHECK: FAIL - shouldnt_normalize1
|
||||
# CHECK: Errors: missing a required argument: 'kernel_size'
|
||||
@run_test
|
||||
def shouldnt_normalize1():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
args = (torch.randn((1, 3, 32, 32)),)
|
||||
kwargs = {"stride": []}
|
||||
normalize_args_kwargs(target, args, kwargs)
|
||||
|
||||
|
||||
# This next two tests are XPASS because of https://github.com/pytorch/pytorch/issues/75342
|
||||
# I.e., they should fail but in fact they pass because of the upstream bug.
|
||||
# The reason for the bug is a fast path branch in operator_schemas.normalize_function
|
||||
# that doesn't do rigorous type checking, and hence lets type mistmatches slip through.
|
||||
# TODO(max): change these to FAIL when the upstream bug is fixed.
|
||||
|
||||
# CHECK: XPASS - shouldnt_normalize2
|
||||
@run_test(XPASS=True)
|
||||
def shouldnt_normalize2():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
args = (torch.randn((1, 3, 32, 32)),)
|
||||
kwargs = {"kernel_size": []}
|
||||
normalize_args_kwargs(target, args, kwargs)
|
||||
|
||||
|
||||
# CHECK: XPASS - shouldnt_normalize3
|
||||
@run_test(XPASS=True)
|
||||
def shouldnt_normalize3():
|
||||
target = torch.ops.aten.max_pool2d_with_indices.default
|
||||
args = (torch.randn((1, 3, 32, 32)),)
|
||||
kwargs = {"kernel_size": [3, 3], "padding": None}
|
||||
normalize_args_kwargs(target, args, kwargs)
|
|
@@ -1,11 +0,0 @@
#-------------------------------------------------------------------------------
# Subdirectories
#-------------------------------------------------------------------------------

## Declare the sources of the Python module.

declare_mlir_python_sources(TorchMLIRPythonSources.EagerMode
  ROOT_DIR "${TORCH_MLIR_PYTHON_ROOT_DIR}"
  ADD_TO_PARENT TorchMLIRPythonSources
  SOURCES_GLOB eager_mode/*.py lazytensor/*.py
)
@@ -1,3 +0,0 @@
import os

EAGER_MODE_DEBUG = os.environ.get("EAGER_MODE_DEBUG", 'False').lower() in ('true', '1', 't')
@ -1,359 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
"""
|
||||
Translator from torch.jit.ScriptFunction to MLIR.
|
||||
|
||||
|
||||
The following defines a set of classes for converting types used by Python and PyTorch into MLIR types from the
|
||||
`torch` dialect.
|
||||
|
||||
The expected use of this module is to create an instance of one of the classes below, and then calling the
|
||||
`to_mlir` method to generate the MLIR representation of the type.
|
||||
|
||||
Information about what types are supported by each class can be found in docstrings of each of the classes.
|
||||
|
||||
In addition this module defines a function that take a torch.jit.ScriptFunction and converts it into an MLIR module.
|
||||
|
||||
The expected use for this module is to use the function
|
||||
`build_module(jit_function: torch.jit.ScriptFunction annotation: Annotation) -> ir.Module`
|
||||
to convert the TorchScript function into MLIR using the `torch` dialect.
|
||||
"""
|
||||
|
||||
import abc
|
||||
import re
|
||||
from typing import Any, Optional, Iterable, Dict
|
||||
from typing import Union
|
||||
|
||||
import numpy as np
|
||||
import torch
|
||||
import torch._C
|
||||
import torch.jit
|
||||
from torch._ops import OpOverload
|
||||
|
||||
from torch_mlir import ir
|
||||
from torch_mlir.dialects.func import FuncOp
|
||||
from torch_mlir.dialects.torch.importer.jit_ir import ModuleBuilder
|
||||
|
||||
|
||||
class TorchMlirType(abc.ABC):
|
||||
"""
|
||||
A `TorchMlirType` is an object that produces MLIR
|
||||
types in the `torch` dialect. The only requirement
|
||||
for a class to be a subclass of `TorchMlirType` is
|
||||
to define a `to_mlir(self, ir.Context) -> ir.Type`.
|
||||
Each class is allowed to have different types of
|
||||
__init__ methods depending on the information they
|
||||
require to produce the given MLIR representation.
|
||||
"""
|
||||
|
||||
@abc.abstractmethod
|
||||
def to_mlir(self, context: ir.Context) -> ir.Type:
|
||||
pass
|
||||
|
||||
|
||||
class TorchTensorTypeError(Exception):
|
||||
def __init__(self, value: str):
|
||||
super().__init__()
|
||||
self.value = value
|
||||
|
||||
def __str__(self) -> str:
|
||||
return self.value
|
||||
|
||||
|
||||
class TorchTensorType(TorchMlirType):
|
||||
"""
|
||||
This class is used to generate types of the form
|
||||
!torch.tensor and !torch.vtensor<SHAPE, DTYPE>,
|
||||
where SHAPE is a list representing the shape of the tensor,
|
||||
and DTYPE is an MLIR data type.
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
*,
|
||||
shape: Optional[Iterable[Optional[int]]] = None,
|
||||
dtype: Optional[torch.dtype] = None,
|
||||
):
|
||||
self.shape = shape
|
||||
self.dtype = dtype
|
||||
|
||||
if dtype is None and shape is not None:
|
||||
err = "If shape is specified, dtype must also be specified"
|
||||
raise TorchTensorTypeError(err)
|
||||
|
||||
def __str__(self):
|
||||
return f"Torch Tensor (shape={self.shape}, dtype={self.dtype})"
|
||||
|
||||
def to_mlir(self, context: ir.Context) -> ir.Type:
|
||||
if self.dtype is None:
|
||||
return ir.Type.parse("!torch.tensor", context=context)
|
||||
|
||||
shape_asm = self._shape_to_mlir_asm()
|
||||
dtype_asm = self._dtype_to_mlir_asm()
|
||||
return ir.Type.parse(
|
||||
f"!torch.vtensor<{shape_asm},{dtype_asm}>", context=context
|
||||
)
|
||||
|
||||
def _shape_to_mlir_asm(self) -> str:
|
||||
if self.shape is None:
|
||||
return "*"
|
||||
|
||||
str_sizes = map(lambda x: "?" if x is None else str(x), self.shape)
|
||||
return f'[{",".join(str_sizes)}]'
|
||||
|
||||
def _dtype_to_mlir_asm(self) -> str:
|
||||
if self.dtype in [torch.float64]:
|
||||
return "f64"
|
||||
if self.dtype in [torch.float, torch.float32]:
|
||||
return "f32"
|
||||
if self.dtype in [torch.int, torch.int32]:
|
||||
return "si32"
|
||||
if self.dtype in [torch.int64]:
|
||||
return "si64"
|
||||
if self.dtype in [torch.bool]:
|
||||
return "i1"
|
||||
|
||||
raise NotImplementedError(f"Unsupported dtype: {self.dtype}")
|
||||
|
||||
|
||||
class TorchNnModuleType(TorchMlirType):
|
||||
"""This class is used to generate types for `!torch.nn.Module`s."""
|
||||
|
||||
def __init__(self, module_name: str):
|
||||
self.module_name = module_name
|
||||
|
||||
def __str__(self):
|
||||
return "torch.nn.Module"
|
||||
|
||||
def to_mlir(self, context: ir.Context) -> ir.Type:
|
||||
return ir.Type.parse(f'!torch.nn.Module<"{self.module_name}">', context=context)
|
||||
|
||||
|
||||
class PythonType(TorchMlirType):
|
||||
"""
|
||||
This class is used to convert regular Python types
|
||||
into their corresponding `torch` dialect representation.
|
||||
The list of supported types can be found in the dictionary
|
||||
`_type_to_asm_dict`.
|
||||
"""
|
||||
|
||||
_type_to_asm_dict = {
|
||||
bool: "!torch.bool",
|
||||
int: "!torch.int",
|
||||
type(None): "!torch.none",
|
||||
}
|
||||
|
||||
def __init__(self, type_: Any):
|
||||
self.type_ = type_
|
||||
|
||||
def __str__(self):
|
||||
return str(self.type_)
|
||||
|
||||
def to_mlir(self, context: ir.Context) -> ir.Type:
|
||||
asm = self._type_to_asm_dict.get(self.type_)
|
||||
if asm is None:
|
||||
raise NotImplementedError(f"Unsupported type: {self.type_}")
|
||||
return ir.Type.parse(asm, context=context)
|
||||
|
||||
|
||||
# TODO: This functionality should be incorporated into ModuleBuilder.import_function.
|
||||
class Annotation:
|
||||
def __init__(self, types: Iterable[Union[TorchTensorType, type]]):
|
||||
self.types = list(
|
||||
map(lambda t: PythonType(t) if isinstance(t, type) else t, types)
|
||||
)
|
||||
|
||||
def __str__(self):
|
||||
result = f"Annotation instance with {len(self.types)} types\n"
|
||||
for e, type_ in enumerate(self.types):
|
||||
result += f" Type of argument {e + 1}: {str(type_)}\n"
|
||||
return result
|
||||
|
||||
def __iter__(self):
|
||||
return iter(self.types)
|
||||
|
||||
|
||||
class AnnotationConverter:
|
||||
@staticmethod
|
||||
def to_mlir_array_attr(annotation: Annotation, context: ir.Context) -> ir.ArrayAttr:
|
||||
dict_attrs = []
|
||||
for type_ in annotation:
|
||||
if not isinstance(type_, TorchTensorType):
|
||||
dict_attrs.append(ir.DictAttr.get({}, context=context))
|
||||
continue
|
||||
|
||||
ir_type = type_.to_mlir(context)
|
||||
with context:
|
||||
type_attr = ir.TypeAttr.get(ir_type)
|
||||
dict_attr = ir.DictAttr.get({"torch.type_bound": type_attr})
|
||||
dict_attrs.append(dict_attr)
|
||||
|
||||
return ir.ArrayAttr.get(dict_attrs, context=context)
|
||||
|
||||
|
||||
def get_func_op_with_name(module: ir.Module, name: str) -> Optional[FuncOp]:
|
||||
with module.context:
|
||||
name_attr = ir.StringAttr.get(name)
|
||||
for op in module.body.operations:
|
||||
if isinstance(op, FuncOp) and op.name == name_attr:
|
||||
# Add name of torch op as debug_module_name so that
|
||||
# run_pipeline_with_repro_report can use it.
|
||||
module.operation.attributes["torch.debug_module_name"] = name_attr
|
||||
return op
|
||||
|
||||
return None
|
||||
|
||||
|
||||
def is_tensor_type(typ: torch._C.Type):
|
||||
return typ.isSubtypeOf(torch.TensorType.get()) or (
|
||||
isinstance(typ, torch.OptionalType)
|
||||
and typ.getElementType().isSubtypeOf(torch._C.TensorType.get())
|
||||
)
|
||||
|
||||
|
||||
def is_list_of_tensors_type(typ: torch._C.Type):
|
||||
return isinstance(typ, torch.ListType) and is_tensor_type(typ.getElementType())
|
||||
|
||||
|
||||
name_mangle_regex = re.compile("[^a-zA-Z0-9]")
|
||||
|
||||
|
||||
def build_ts_script_function(
|
||||
schema: torch._C.FunctionSchema, kwargs: Dict[str, Any]
|
||||
) -> torch.jit.ScriptFunction:
|
||||
"""Build a torch.jit.ScriptFunction that corresponds to the schema.
|
||||
|
||||
Constants are inlined for the purposes of invalidating the compile cache when they change.
|
||||
|
||||
Parameters
|
||||
----------
|
||||
schema: torch._C.FunctionSchema
|
||||
PyTorch's representation for ops, contains type information needed for inlining constants into the TS graph.
|
||||
kwargs: Dict
|
||||
A dictionary with all arguments passed in through __torch_dispatch__ (including int/float/bool params).
|
||||
|
||||
Returns
|
||||
-------
|
||||
torch.jit.ScriptFunction
|
||||
Fully specialized (all constants) TS graph whose only arguments are tensors.
|
||||
"""
|
||||
|
||||
# Creates empty TS graph.
|
||||
graph = torch._C.Graph()
|
||||
# Creates and inserts node with identifier `schema.name`; NB node has no inputs or outputs at this point.
|
||||
node = graph.insertNode(graph.create(schema.name, len(schema.returns)))
|
||||
# Associate graph inputs/outputs with node inputs/outputs.
|
||||
graph_inputs = []
|
||||
for arg in schema.arguments:
|
||||
arg_name = arg.name if arg.name != "self" else "input"
|
||||
|
||||
# If arg is a flattened list of tensors, such as in the case of torch.cat
|
||||
# then add each element of the list to the graph corresponding to arg
|
||||
# and insert a ListConstruct to function as input to the op.
|
||||
if is_list_of_tensors_type(arg.type):
|
||||
inps = []
|
||||
for kwarg in [
|
||||
kwarg for kwarg in kwargs if f"{arg_name}_flattened" in kwarg
|
||||
]:
|
||||
inp = graph.addInput()
|
||||
el_typ = arg.type.getElementType()
|
||||
if isinstance(el_typ, torch.OptionalType):
|
||||
el_typ = el_typ.getElementType()
|
||||
inp.setType(el_typ)
|
||||
inp.setDebugName(kwarg)
|
||||
inps.append(inp)
|
||||
graph_inputs.append(kwarg)
|
||||
list_cons = graph.insertNode(graph.create("prim::ListConstruct", inps))
|
||||
list_cons.moveBefore(node)
|
||||
inp = list_cons.output()
|
||||
inp.setType(torch.ListType.ofTensors())
|
||||
# If arg is a tensor, then add input to the graph corresponding to arg.
|
||||
elif is_tensor_type(arg.type) and kwargs[arg_name] is not None:
|
||||
inp = graph.addInput()
|
||||
if isinstance(arg.type, torch.OptionalType):
|
||||
el_typ = arg.type.getElementType()
|
||||
else:
|
||||
el_typ = arg.type
|
||||
inp.setType(el_typ)
|
||||
inp.setDebugName(arg_name)
|
||||
graph_inputs.append(arg_name)
|
||||
# If arg is a constant, inline (at the top of the graph).
|
||||
else:
|
||||
val = kwargs[arg_name]
|
||||
if val == []:
|
||||
# Some ops have empty list default values for args
|
||||
# (such as aten::max_pool2d_with_indices with int[2] stride=[]
|
||||
# but graph.insertConstant doesnt' recognize [] as an empty list IValue.
|
||||
# This might be an upstream bug but there doesn't seem to be a way to
|
||||
# build a prim::ListConstruct list that's empty.
|
||||
val = None
|
||||
inp = graph.insertConstant(val)
|
||||
inp.node().moveBefore(node)
|
||||
|
||||
node.addInput(inp)
|
||||
|
||||
# Reorder graph inputs to match kwargs.
|
||||
permutes = [
|
||||
{inp: i for i, inp in enumerate(graph_inputs)}[kwarg]
|
||||
for kwarg in [kwarg for kwarg in kwargs if kwarg in graph_inputs]
|
||||
]
|
||||
graph.permuteInputs(permutes)
|
||||
|
||||
if node.hasMultipleOutputs():
|
||||
for outp in node.outputs():
|
||||
graph.registerOutput(outp)
|
||||
else:
|
||||
graph.registerOutput(node.output())
|
||||
|
||||
fn = torch._C._create_function_from_graph(
|
||||
f"{name_mangle_regex.sub('', str(graph))}", graph
|
||||
)
|
||||
return fn
|
||||
|
||||
|
||||
def build_mlir_module(op: OpOverload, kwargs: Dict[str, Any]) -> ir.Module:
|
||||
"""Translate input function into an MLIR module in the `torch` dialect.
|
||||
|
||||
Parameters
|
||||
----------
|
||||
op: OpOverload
|
||||
Callable from the torch.ops.aten module/namespace that has a _schema field.
|
||||
kwargs: Dict
|
||||
A dictionary with all arguments passed in through __torch_dispatch__ (including int/float,bool params).
|
||||
|
||||
Returns
|
||||
-------
|
||||
ir.Module
|
||||
Translation of the input module into an MLIR module.
|
||||
"""
|
||||
|
||||
# The assert here is to catch tensor shapes that have size 0 dimensions, such as those produced in
|
||||
# the course of evaluating SliceEndSleStartModule_basic and SliceOutOfLowerBoundEndIndexModule_basic.
|
||||
# Such 0 size dimensions fail the assert at mlir/lib/IR/BuiltinTypes.cpp, line 887
|
||||
annotations = []
|
||||
for arg_name, arg in kwargs.items():
|
||||
if isinstance(arg, torch.Tensor):
|
||||
assert np.prod(arg.shape) != 0, f"{arg_name} has invalid shape {arg.shape}"
|
||||
annotations.append(TorchTensorType(shape=tuple(arg.shape), dtype=arg.dtype))
|
||||
annotations = tuple(annotations)
|
||||
|
||||
script_fun = build_ts_script_function(op._schema, kwargs)
|
||||
assert len(annotations) == len(
|
||||
list(script_fun.graph.inputs())
|
||||
), "Number of annotations and number of graph inputs differs."
|
||||
|
||||
mb = ModuleBuilder()
|
||||
mb.import_function(script_fun)
|
||||
|
||||
func_op = get_func_op_with_name(mb.module, script_fun.name)
|
||||
assert (
|
||||
func_op is not None
|
||||
), "Unable to find FuncOp in new module. Make sure function was imported correctly into ModuleBuilder"
|
||||
|
||||
func_annotation = Annotation(annotations)
|
||||
arg_attrs = AnnotationConverter.to_mlir_array_attr(func_annotation, mb.context)
|
||||
func_op.attributes["arg_attrs"] = arg_attrs
|
||||
|
||||
return mb.module
|
|
@ -1,111 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
from __future__ import annotations
|
||||
|
||||
from typing import Any, Callable, Tuple
|
||||
from typing import Dict
|
||||
|
||||
import torch
|
||||
from torch.fx import immutable_collections
|
||||
from torch.fx.operator_schemas import (
|
||||
_torchscript_schema_to_signature,
|
||||
_args_kwargs_to_normalized_args_kwargs,
|
||||
)
|
||||
from torch_mlir._mlir_libs._jit_ir_importer import get_registered_ops
|
||||
|
||||
from torch_mlir.dialects import torch as torch_dialect
|
||||
|
||||
OP_REGISTRY = {op["name"]: op for op in get_registered_ops()}
|
||||
SUPPORTED_OPS = frozenset(
|
||||
[
|
||||
member.OPERATION_NAME
|
||||
for member in vars(torch_dialect).values()
|
||||
if hasattr(member, "OPERATION_NAME")
|
||||
]
|
||||
)
|
||||
|
||||
|
||||
class UnsupportedByTorchMlirEagerMode(Exception):
|
||||
def __init__(self, value: str):
|
||||
super().__init__()
|
||||
self.value = value
|
||||
|
||||
def __str__(self) -> str:
|
||||
return self.value
|
||||
|
||||
|
||||
def normalize_args_kwargs(target: Callable, args: Tuple[Any], kwargs: Dict[str, Any]):
|
||||
"""Fill in default values for optional args, which are dependent on the schema."""
|
||||
sig = _torchscript_schema_to_signature(target._schema)
|
||||
_, new_kwargs = _args_kwargs_to_normalized_args_kwargs(
|
||||
sig, args, kwargs, normalize_to_only_use_kwargs=True
|
||||
)
|
||||
if "self" in new_kwargs:
|
||||
new_kwargs["input"] = new_kwargs.pop("self")
|
||||
|
||||
# Flatten lists of args for ops that takes lists, such as torch.cat.
|
||||
to_remove = set()
|
||||
to_add = {}
|
||||
for k, v in new_kwargs.items():
|
||||
if isinstance(v, (tuple, list)) and len(v) and isinstance(v[0], torch.Tensor):
|
||||
to_remove.add(k)
|
||||
for i, vv in enumerate(v):
|
||||
to_add[f"{k}_flattened_{i}"] = vv
|
||||
|
||||
for rem in to_remove:
|
||||
del new_kwargs[rem]
|
||||
new_kwargs.update(**to_add)
|
||||
|
||||
# Sort here in order to have consistency across TS graph and
|
||||
# MLIR module.
|
||||
sorted_kwargs = dict(sorted(new_kwargs.items()))
|
||||
return immutable_collections.immutable_dict(sorted_kwargs)
|
||||
|
||||
|
||||
def get_registered_op(op):
|
||||
registered_op = OP_REGISTRY[(op._schema.name, op._schema.overload_name)]
|
||||
return registered_op
|
||||
|
||||
|
||||
def check_get_aliased_arg(func: Callable,):
|
||||
"""Write back to mutable args that aren't properly handled otherwise.
|
||||
|
||||
Because of how we pass values to the backend we don't currently support ops that mutate operands.
|
||||
That includes both inplace variants and outplace variants. Additionally, Torch-MLIR,
|
||||
as of right now, only handles arguments with value semantics, so we need to manually fake those semantics, which
|
||||
we can for these special cases. Hence, the solution is to manually write back to the same operand that the
|
||||
conventional pytorch op variant would write to.
|
||||
|
||||
Note that there are ops where multiple operands are mutable (such as batchnorm outplace variants that
|
||||
mutate running_mean and running_var). We don't currently handle those.
|
||||
"""
|
||||
|
||||
registered_op = get_registered_op(func)
|
||||
if not registered_op["is_mutable"]:
|
||||
return None
|
||||
|
||||
if len(registered_op["returns"]) > 1:
|
||||
raise UnsupportedByTorchMlirEagerMode(
|
||||
"TorchMLIR doesn't handle multiple aliased returns yet."
|
||||
)
|
||||
|
||||
aliased_arg = next(
|
||||
arg
|
||||
for arg in registered_op["arguments"]
|
||||
if "alias_info" in arg and arg["alias_info"]["is_write"]
|
||||
)
|
||||
assert (
|
||||
"alias_info" in registered_op["returns"][0]
|
||||
and registered_op["returns"][0]["alias_info"]["is_write"]
|
||||
and len(registered_op["returns"][0]["alias_info"]["after"]) == 1
|
||||
and registered_op["returns"][0]["alias_info"]["after"][0]
|
||||
)
|
||||
assert (
|
||||
len(aliased_arg["alias_info"]["after"]) == 1
|
||||
and aliased_arg["alias_info"]["after"][0]
|
||||
== registered_op["returns"][0]["alias_info"]["after"][0]
|
||||
)
|
||||
|
||||
return aliased_arg["name"] if aliased_arg["name"] != "self" else "input"
|
|
@ -1,102 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
import abc
|
||||
from dataclasses import dataclass
|
||||
from typing import TypeVar, Tuple, Callable, List, Dict, Any
|
||||
|
||||
import torch
|
||||
|
||||
from torch_mlir._mlir_libs._mlir.ir import Module
|
||||
|
||||
# TODO: This might need to be an ABC too, such as
|
||||
# to support finding the backend that created the tensor.
|
||||
DeviceTensor = TypeVar("DeviceTensor")
|
||||
|
||||
|
||||
@dataclass(frozen=True)
|
||||
class TensorMetaData:
|
||||
"""A small container for metadata necessary for satisfying the pytorch dispatcher and other code (pytorch or
|
||||
otherwise) that branches on these attributes.
|
||||
|
||||
There is a lot of code in the PyTorch codebase that branches based on these attributes; the obvious ones here
|
||||
are dtype, device, and requires_grad (necessary for autograd itself). There is ample warning from PyTorch that,
|
||||
in principle, these should be as close as possible to true; see
|
||||
https://github.com/albanD/subclass_zoo/blob/1566e038f03cd89ab3cc37e670a44e3c2bbc1897/trivial_tensors.py#L90-L92
|
||||
|
||||
The defaults (properties) simplify the api and seem to work after some testing but
|
||||
might malfunction in unexpected ways.
|
||||
# TODO: revisit these assumptions
|
||||
"""
|
||||
|
||||
size: Tuple[int]
|
||||
dtype: torch.dtype
|
||||
requires_grad: bool
|
||||
|
||||
strides: Tuple[int]
|
||||
storage_offset: int = 0
|
||||
layout: torch.layout = torch.strided
|
||||
device: torch.device = torch.device("cpu")
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
size,
|
||||
dtype,
|
||||
requires_grad,
|
||||
strides=None,
|
||||
storage_offset=None,
|
||||
layout=None,
|
||||
device=None,
|
||||
):
|
||||
super().__init__()
|
||||
object.__setattr__(self, "size", size)
|
||||
object.__setattr__(self, "dtype", dtype)
|
||||
object.__setattr__(self, "requires_grad", requires_grad)
|
||||
|
||||
object.__setattr__(
|
||||
self, "strides", strides if strides is not None else len(size) * [0]
|
||||
)
|
||||
object.__setattr__(
|
||||
self, "storage_offset", storage_offset if storage_offset is not None else 0
|
||||
)
|
||||
object.__setattr__(
|
||||
self, "layout", layout if layout is not None else torch.strided
|
||||
)
|
||||
object.__setattr__(
|
||||
self, "device", device if device is not None else torch.device("cpu")
|
||||
)
|
||||
|
||||
|
||||
class TorchMLIREagerBackend(abc.ABC):
|
||||
@abc.abstractmethod
|
||||
def compile(
|
||||
self, module: Module
|
||||
) -> Callable[[List[DeviceTensor]], List[DeviceTensor]]:
|
||||
raise NotImplementedError
|
||||
|
||||
@abc.abstractmethod
|
||||
def transfer_from_torch_to_device(self, tensor: torch.Tensor) -> DeviceTensor:
|
||||
"""Unwrap the backend representation in order to build a torch.Tensor."""
|
||||
raise NotImplementedError
|
||||
|
||||
@abc.abstractmethod
|
||||
def get_torch_metadata(
|
||||
self, tensor: DeviceTensor, kwargs: Dict[str, Any]
|
||||
) -> TensorMetaData:
|
||||
"""Parse relevant tensor metadata from backend device array (e.g., shape, stride, layout) in order to build
|
||||
wrapper tensor."""
|
||||
raise NotImplementedError
|
||||
|
||||
@abc.abstractmethod
|
||||
def transfer_from_device_to_torch(self, tensor: DeviceTensor) -> torch.Tensor:
|
||||
"""If compilation fails for some reason then device specific representations need to be munged into a
|
||||
torch.Tensor representation.
|
||||
"""
|
||||
raise NotImplementedError
|
||||
|
||||
@abc.abstractmethod
|
||||
def copy_into(self, dst: DeviceTensor, src: DeviceTensor):
|
||||
"""This method is needed for things like handling aliased arguments."""
|
||||
raise NotImplementedError
|
|
@ -1,257 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
import contextlib
|
||||
import re
|
||||
import traceback
|
||||
import warnings
|
||||
from typing import Any
|
||||
|
||||
import torch
|
||||
from torch.utils._pytree import tree_map
|
||||
|
||||
from torch_mlir.eager_mode.ir_building import build_mlir_module
|
||||
from torch_mlir.eager_mode.torch_mlir_dispatch import (
|
||||
UnsupportedByTorchMlirEagerMode,
|
||||
normalize_args_kwargs,
|
||||
check_get_aliased_arg,
|
||||
)
|
||||
from torch_mlir.eager_mode import EAGER_MODE_DEBUG
|
||||
from torch_mlir_e2e_test.eager_backends.refbackend import EagerModeRefBackend
|
||||
|
||||
|
||||
@contextlib.contextmanager
|
||||
def no_dispatch():
|
||||
"""Prevent infinite recursion in case accidentally calling a tensor method on a TorchMLIRTensor within
|
||||
__torch_dispatch__."""
|
||||
|
||||
guard = torch._C._DisableTorchDispatch()
|
||||
try:
|
||||
yield
|
||||
finally:
|
||||
del guard
|
||||
|
||||
|
||||
backend = EagerModeRefBackend()
|
||||
|
||||
UNSUPPORTED_OPS = re.compile(
|
||||
"|".join([
|
||||
# We don't handle detach as it only pertains to autograd graph construction, which is handled by pytorch.
|
||||
"detach",
|
||||
# We don't handle _local_scalar_dense because it's just a way to unwrap a tensor that wraps a number.
|
||||
"_local_scalar_dense",
|
||||
# https://github.com/llvm/torch-mlir/issues/878
|
||||
"_unsafe_view",
|
||||
"view",
|
||||
])
|
||||
)
|
||||
|
||||
|
||||
class TorchMLIRTensor(torch.Tensor):
|
||||
"""This class serves the role abstract class with common functionality for dispatching through Torch-MLIR instead of aten.
|
||||
|
||||
It defers device specific behavior to device specific implementations. The deriving classes use the
|
||||
make_bare_wrapper_subclass convenience method, adjacent here, and override __torch_dispatch__ in order to dispatch
|
||||
through Torch-MLIR instead of aten. Backends are free to choose whatever representation of the buffers (i.e., `elem`)
|
||||
and are expected to provide conversion mechanisms between their representation and torch.Tensor.
|
||||
|
||||
Here we only verify that inputs abide by current supported features of Torch-MLIR (contiguous memory and
|
||||
strided tensor layout) and build the mlir module. Importantly, we also recover from any malfunctions in the
|
||||
deriving classes and dispatch back to conventional PyTorch.
|
||||
|
||||
More documentation on how the __torch_dispatch__ pattern works can be found in this forum post
|
||||
https://dev-discuss.pytorch.org/t/what-and-why-is-torch-dispatch/557
|
||||
and this RFC
|
||||
https://github.com/pytorch/rfcs/blob/master/RFC-0001-torch-function-for-methods.md#process-followed-during-a-functionmethod-call
|
||||
and this repo with many examples
|
||||
https://github.com/albanD/subclass_zoo
|
||||
"""
|
||||
|
||||
elem: Any
|
||||
|
||||
__slots__ = ["elem"]
|
||||
|
||||
def __new__(cls, elem, **kwargs):
|
||||
"""Wrap elem (which could be a torch.Tensor or otherwise) in a torch.Tensor subclass.
|
||||
|
||||
Critically, this method needs to parse relevant metadata from the device representation
|
||||
(such as shape, striding, dtype, etc.) and translate it into torch conventions.
|
||||
|
||||
Deriving classes must provide a way to construct themselves from either their device specific representation
|
||||
or torch.Tensor; the latter is to handle the case that dispatch to PyTorch to recover from an error.
|
||||
"""
|
||||
if kwargs.get("constructing_from_device_tensor", False):
|
||||
tensor_meta_data = backend.get_torch_metadata(elem, kwargs)
|
||||
r = make_bare_wrapper_subclass(
|
||||
cls=cls,
|
||||
size=tensor_meta_data.size,
|
||||
strides=tensor_meta_data.strides,
|
||||
storage_offset=tensor_meta_data.storage_offset,
|
||||
dtype=tensor_meta_data.dtype,
|
||||
layout=tensor_meta_data.layout,
|
||||
device=tensor_meta_data.device,
|
||||
requires_grad=tensor_meta_data.requires_grad,
|
||||
)
|
||||
r.elem = elem
|
||||
elif isinstance(elem, torch.nn.Parameter):
|
||||
r = make_wrapper_subclass_from_torch_tensor(cls, elem.data, **kwargs)
|
||||
r.elem = backend.transfer_from_torch_to_device(elem.detach().data)
|
||||
elif isinstance(elem, torch.Tensor):
|
||||
r = make_wrapper_subclass_from_torch_tensor(cls, elem, **kwargs)
|
||||
r.elem = backend.transfer_from_torch_to_device(elem)
|
||||
# This branch handles the case when a python scalar is passed to some op
|
||||
# or is returned from some aten op, such as _local_scalar_dense.
|
||||
elif isinstance(elem, (int, float, bool)):
|
||||
return elem
|
||||
else:
|
||||
raise ValueError(f"Unknown element type: {type(elem)}")
|
||||
|
||||
return r
|
||||
|
||||
def __repr__(self):
|
||||
if self.grad_fn:
|
||||
return f"TorchMLIRTensor({self.elem}, backend={backend.__class__.__name__}, grad_fn={self.grad_fn})"
|
||||
else:
|
||||
return f"TorchMLIRTensor({self.elem}, backend={backend.__class__.__name__})"
|
||||
|
||||
@classmethod
|
||||
def __torch_dispatch__(cls, func, _types, args=(), kwargs=None):
|
||||
requires_grad = check_requires_grad(*args, **kwargs)
|
||||
try:
|
||||
with no_dispatch():
|
||||
if hasattr(func, "op_name"):
|
||||
op_name = func.op_name
|
||||
elif hasattr(func, "__name__"):
|
||||
# Handle builtin_function_or_method.
|
||||
op_name = func.__name__
|
||||
else:
|
||||
raise RuntimeError(f"op {func} has no name")
|
||||
|
||||
requires_grad = requires_grad and "view" not in op_name
|
||||
|
||||
if UNSUPPORTED_OPS.match(op_name):
|
||||
raise UnsupportedByTorchMlirEagerMode(op_name)
|
||||
|
||||
if not hasattr(func, "_schema"):
|
||||
raise RuntimeError(f"op {func} has no schema.")
|
||||
|
||||
normalized_kwargs = normalize_args_kwargs(func, args, kwargs)
|
||||
|
||||
if "layout" in normalized_kwargs and normalized_kwargs[
|
||||
"layout"
|
||||
] not in {0, None}:
|
||||
raise UnsupportedByTorchMlirEagerMode(
|
||||
f"{normalized_kwargs['layout']} layout not supported."
|
||||
)
|
||||
if "memory_format" in normalized_kwargs and normalized_kwargs[
|
||||
"memory_format"
|
||||
] not in {0, None}:
|
||||
raise UnsupportedByTorchMlirEagerMode(
|
||||
f"{normalized_kwargs['memory_format']} memory format not supported."
|
||||
)
|
||||
eager_module = build_mlir_module(func, normalized_kwargs)
|
||||
device_tensor_args = [
|
||||
kwarg.elem
|
||||
for _, kwarg in normalized_kwargs.items()
|
||||
if isinstance(kwarg, cls)
|
||||
]
|
||||
assert len(eager_module.body.operations[0].arguments) == len(
|
||||
device_tensor_args
|
||||
), "Number of parameters and number of arguments differs."
|
||||
op_mlir_backend_callable = backend.compile(eager_module)
|
||||
out = op_mlir_backend_callable(*device_tensor_args)
|
||||
out = tree_map(
|
||||
lambda x: cls(
|
||||
x, requires_grad=requires_grad, constructing_from_device_tensor=True
|
||||
),
|
||||
out,
|
||||
)
|
||||
except Exception as e:
|
||||
if EAGER_MODE_DEBUG:
|
||||
warnings.warn(traceback.format_exc())
|
||||
if isinstance(e, UnsupportedByTorchMlirEagerMode):
|
||||
warnings.warn(
|
||||
f"Couldn't use TorchMLIR eager because current incompatibility: *{str(e)}*; running through PyTorch eager."
|
||||
)
|
||||
else:
|
||||
warnings.warn(
|
||||
f"Couldn't use TorchMLIR eager because of error: *{str(e)}*; "
|
||||
f"running through PyTorch eager. Please file an issue at https://github.com/llvm/torch-mlir/issues"
|
||||
)
|
||||
|
||||
with no_dispatch():
|
||||
unwrapped_args = tree_map(cls.unwrap, args)
|
||||
unwrapped_kwargs = tree_map(cls.unwrap, kwargs)
|
||||
out = func(*unwrapped_args, **unwrapped_kwargs)
|
||||
|
||||
out = tree_map(lambda x: cls(x, requires_grad=requires_grad), out)
|
||||
|
||||
maybe_aliased_arg_name = check_get_aliased_arg(func)
|
||||
if maybe_aliased_arg_name is not None:
|
||||
backend.copy_into(normalized_kwargs[maybe_aliased_arg_name].elem, out.elem)
|
||||
|
||||
return out
|
||||
|
||||
@classmethod
|
||||
def unwrap(cls, e):
|
||||
"""Unwrap the TorchMLIRTensor representation in order to access the actual device specific representation."""
|
||||
if isinstance(e, cls):
|
||||
return backend.transfer_from_device_to_torch(e.elem)
|
||||
return e
|
||||
|
||||
|
||||
def check_requires_grad(*args, **kwargs):
|
||||
requires_grad = False
|
||||
|
||||
def check_grad(e):
|
||||
nonlocal requires_grad
|
||||
if isinstance(e, TorchMLIRTensor):
|
||||
requires_grad |= e.requires_grad
|
||||
|
||||
tree_map(check_grad, args)
|
||||
tree_map(check_grad, kwargs)
|
||||
|
||||
return requires_grad
|
||||
|
||||
|
||||
def make_wrapper_subclass_from_torch_tensor(cls, elem, **kwargs):
|
||||
"""Convenience method that parse out relevant metadata from a torch.Tensor, in order to produce
|
||||
a wrapper subclass.
|
||||
|
||||
NB: this convenience method does not set that `elem` attribute of the subclass, as that is the responsibility
|
||||
of the device specific implementation.
|
||||
"""
|
||||
r = make_bare_wrapper_subclass(
|
||||
cls=cls,
|
||||
size=elem.size(),
|
||||
strides=elem.stride(),
|
||||
storage_offset=elem.storage_offset(),
|
||||
dtype=elem.dtype,
|
||||
layout=elem.layout,
|
||||
device=elem.device,
|
||||
# Only float tensors can have gradients.
|
||||
requires_grad=elem.dtype in {torch.float, torch.float32, torch.float64}
|
||||
and (kwargs.get("requires_grad", False) or elem.requires_grad),
|
||||
)
|
||||
return r
|
||||
|
||||
|
||||
def make_bare_wrapper_subclass(
|
||||
*, cls, size, strides, storage_offset, dtype, layout, device, requires_grad
|
||||
):
|
||||
"""Convenience method that builds a wrapper subclass.
|
||||
|
||||
NB: this convenience method does not set that `elem` attribute of the subclass, as that is the responsibility
|
||||
of the device specific implementation.
|
||||
"""
|
||||
return torch.Tensor._make_wrapper_subclass(
|
||||
cls,
|
||||
size,
|
||||
strides=strides,
|
||||
storage_offset=storage_offset,
|
||||
dtype=dtype,
|
||||
layout=layout,
|
||||
device=device,
|
||||
requires_grad=requires_grad,
|
||||
)
|
|
@@ -9,5 +9,4 @@ from .native_torch import NativeTorchTestConfig
from .torchscript import TorchScriptTestConfig
from .mhlo_backend import MhloBackendTestConfig
from .tosa_backend import TosaBackendTestConfig
from .eager_mode import EagerModeTestConfig
from .torchdynamo import TorchDynamoTestConfig
@ -1,65 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
import torch
|
||||
from torch.utils._pytree import tree_map
|
||||
|
||||
from torch_mlir.eager_mode.torch_mlir_tensor import TorchMLIRTensor
|
||||
from torch_mlir_e2e_test.framework import TestConfig, Trace, TraceItem
|
||||
|
||||
|
||||
def wrap(e):
|
||||
return TorchMLIRTensor(e.detach().clone()) if isinstance(e, torch.Tensor) else e
|
||||
|
||||
|
||||
def unwrap(e):
|
||||
return TorchMLIRTensor.unwrap(e) if isinstance(e, TorchMLIRTensor) else e
|
||||
|
||||
|
||||
def to_tmt(m: torch.nn.Module):
|
||||
for buf_name, buf in m.named_buffers(recurse=True):
|
||||
if isinstance(buf, TorchMLIRTensor):
|
||||
continue
|
||||
m.register_buffer(buf_name, TorchMLIRTensor(buf))
|
||||
for param_name, param in m.named_parameters(recurse=True):
|
||||
if isinstance(param, TorchMLIRTensor):
|
||||
continue
|
||||
m.register_parameter(
|
||||
param_name,
|
||||
torch.nn.Parameter(
|
||||
TorchMLIRTensor(param), requires_grad=param.requires_grad
|
||||
),
|
||||
)
|
||||
for attr in dir(m):
|
||||
field = getattr(m, attr)
|
||||
if isinstance(field, torch.Tensor) and not isinstance(field, TorchMLIRTensor):
|
||||
setattr(m, attr, TorchMLIRTensor(field))
|
||||
|
||||
|
||||
class EagerModeTestConfig(TestConfig):
|
||||
"""Trivial test config that exercises eager mode plumbing"""
|
||||
|
||||
def __init__(self):
|
||||
super().__init__()
|
||||
|
||||
def compile(self, program: torch.nn.Module) -> torch.nn.Module:
|
||||
program.apply(to_tmt)
|
||||
return program
|
||||
|
||||
def run(self, artifact: torch.nn.Module, trace: Trace) -> Trace:
|
||||
result: Trace = []
|
||||
for item in trace:
|
||||
attr = artifact
|
||||
for part in item.symbol.split("."):
|
||||
attr = getattr(attr, part)
|
||||
|
||||
inps = tree_map(wrap, item.inputs)
|
||||
outps = attr(*inps)
|
||||
output = tree_map(unwrap, outps)
|
||||
|
||||
result.append(
|
||||
TraceItem(symbol=item.symbol, inputs=item.inputs, output=output)
|
||||
)
|
||||
return result
|
|
@ -1,90 +0,0 @@
|
|||
# Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
|
||||
# See https://llvm.org/LICENSE.txt for license information.
|
||||
# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
|
||||
# Also available under a BSD-style license. See LICENSE.
|
||||
|
||||
from __future__ import annotations
|
||||
|
||||
from typing import Dict, Any
|
||||
|
||||
import numpy as np
|
||||
import torch
|
||||
|
||||
from torch_mlir.compiler_utils import (
|
||||
get_module_name_for_debug_dump,
|
||||
run_pipeline_with_repro_report,
|
||||
)
|
||||
from torch_mlir.eager_mode.torch_mlir_eager_backend import (
|
||||
TorchMLIREagerBackend,
|
||||
TensorMetaData,
|
||||
)
|
||||
from torch_mlir.ir import Module
|
||||
from torch_mlir_e2e_test.linalg_on_tensors_backends.refbackend import (
|
||||
RefBackendLinalgOnTensorsBackend,
|
||||
)
|
||||
|
||||
NUMPY_TO_TORCH_DTYPE_DICT = {
|
||||
np.bool_: torch.bool,
|
||||
np.uint8: torch.uint8,
|
||||
np.int8: torch.int8,
|
||||
np.int16: torch.int16,
|
||||
np.int32: torch.int32,
|
||||
np.int64: torch.int64,
|
||||
np.float16: torch.float16,
|
||||
np.float32: torch.float32,
|
||||
np.float64: torch.float64,
|
||||
np.complex64: torch.complex64,
|
||||
np.complex128: torch.complex128,
|
||||
}
|
||||
|
||||
_ref_backend = RefBackendLinalgOnTensorsBackend()
|
||||
|
||||
|
||||
class EagerModeRefBackend(TorchMLIREagerBackend):
|
||||
"""Main entry-point for the reference backend for eager mode.
|
||||
|
||||
RefBackend uses numpy.ndarray representations of tensors and thus all of the wrapping and unwrapping
|
||||
and munging here is done to between torch.Tensor and numpy.ndarray.
|
||||
"""
|
||||
|
||||
module_to_refbackend_invoker = {}
|
||||
|
||||
def get_torch_metadata(
|
||||
self, tensor: np.ndarray, kwargs: Dict[str, Any]
|
||||
) -> TensorMetaData:
|
||||
return TensorMetaData(
|
||||
size=tensor.shape,
|
||||
dtype=NUMPY_TO_TORCH_DTYPE_DICT[tensor.dtype.type],
|
||||
requires_grad=tensor.dtype in {np.float, np.float32, np.float64}
|
||||
and kwargs.get("requires_grad", False),
|
||||
)
|
||||
|
||||
def compile(self, imported_module: Module):
|
||||
"""Lower the imported TS module to linalg and then further compile for the reference backend and then call."""
|
||||
fn_name = get_module_name_for_debug_dump(imported_module)
|
||||
module_hash = str(imported_module)
|
||||
if module_hash not in self.module_to_refbackend_invoker:
|
||||
run_pipeline_with_repro_report(
|
||||
imported_module,
|
||||
"builtin.module(torch-function-to-torch-backend-pipeline,torch-backend-to-linalg-on-tensors-backend-pipeline)",
|
||||
"EagerMode",
|
||||
)
|
||||
self.module_to_refbackend_invoker[module_hash] = _ref_backend.load(
|
||||
_ref_backend.compile(imported_module)
|
||||
)
|
||||
|
||||
ref_backend_invoker = self.module_to_refbackend_invoker[module_hash]
|
||||
op_mlir_backend_callable = getattr(ref_backend_invoker, fn_name)
|
||||
assert (
|
||||
op_mlir_backend_callable is not None
|
||||
), f"Couldn't find function in module."
|
||||
return op_mlir_backend_callable
|
||||
|
||||
def copy_into(self, dst: np.ndarray, src: np.ndarray):
|
||||
np.copyto(dst, src)
|
||||
|
||||
def transfer_from_device_to_torch(self, e: np.ndarray):
|
||||
return torch.from_numpy(e).clone()
|
||||
|
||||
def transfer_from_torch_to_device(self, tensor: torch.Tensor) -> np.ndarray:
|
||||
return tensor.detach().numpy()
|