Add BertSequenceClassification model to e2e

Use torch tracing to obtain the module, because the original model is not TorchScriptable out of the box.
2021-09-28 10:56:08 -04:00 · 2021-09-28 10:56:08 -04:00 · 89225b0cd8
parent 649d6e4f28
commit 89225b0cd8
6 changed files with 112 additions and 0 deletions
--- a/build_tools/torchscript_e2e_heavydep_tests/bert_seq_classification.py
+++ b/build_tools/torchscript_e2e_heavydep_tests/bert_seq_classification.py
@ -0,0 +1,70 @@
 # Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 # See https://llvm.org/LICENSE.txt for license information.
 # SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 # Also available under a BSD-style license. See LICENSE.
 # Basic BertForSequenceClassification program to classify the input sentence.
 import torch
 from transformers import BertForSequenceClassification, BertTokenizer
 from torch_mlir_e2e_test.torchscript.framework import TestUtils
 from torch_mlir_e2e_test.torchscript.registry import register_test_case
 from torch_mlir_e2e_test.torchscript.annotations import annotate_args, export
 # Seed torch's global RNG at import time, before any model is constructed
 # (presumably so randomly initialised weights are reproducible -- confirm).
 torch.manual_seed(0)
 # BERT special-token strings.
 # NOTE(review): neither constant is referenced in the visible part of this file.
 CLS = "[CLS]"
 SEP = "[SEP]"
 # Module-level tokenizer shared by _prepare_sentence_tokens; loaded from the
 # "bert-base-uncased" pretrained vocabulary when the module is imported.
 tokenizer = BertTokenizer.from_pretrained("bert-base-uncased")
 def _prepare_sentence_tokens(sentence: str):
    """Encode ``sentence`` with the module-level tokenizer and return a tensor.

    The encoded ids are wrapped in an outer list before being handed to
    ``torch.tensor``, so the result carries a leading dimension of size 1.
    """
    token_ids = tokenizer.encode(sentence)
    single_sentence_batch = [token_ids]
    return torch.tensor(single_sentence_batch)
 class BasicBertSequenceClassification(torch.nn.Module):
    """Thin ``torch.nn.Module`` wrapper around ``BertForSequenceClassification``.

    The wrapped model is loaded from the "bert-base-uncased" checkpoint with
    ``torchscript=True`` and switched to evaluation mode at construction time.
    """

    def __init__(self):
        super().__init__()
        bert = BertForSequenceClassification.from_pretrained(
            # Use the 12-layer BERT model, with an uncased vocab.
            "bert-base-uncased",
            # The number of output labels--2 for binary classification.
            num_labels=2,
            # Whether the model returns attentions weights.
            output_attentions=False,
            # Whether the model returns all hidden-states.
            output_hidden_states=False,
            torchscript=True)
        # Switch to evaluation mode before the model is stored on the wrapper.
        bert.eval()
        self.model = bert

    @export
    @annotate_args([
        None,
        ([-1, -1], torch.int64, True),
    ])
    def forward(self, tokens):
        """Run the wrapped model on ``tokens`` and return its first output.

        The argument annotation declares ``tokens`` as a rank-2 ``torch.int64``
        tensor; the first output is presumably the classification logits
        (TODO confirm against the transformers documentation).
        """
        outputs = self.model.forward(tokens)
        return outputs[0]
 # Example inputs for torch.jit.trace_module, keyed by the name of the method
 # to trace; built once at import time.
 trace_input = {
    'forward': _prepare_sentence_tokens("how do you like the project")
 }
 # Input fed to the module by the registered test case. It is a different
 # sentence from the trace example (presumably so the test does not simply
 # replay the traced input -- confirm).
 test_input = _prepare_sentence_tokens("this project is very interesting")
 def getTracedRecursiveScriptModule():
    """Trace ``BasicBertSequenceClassification`` and return its script module.

    A fresh model is traced with ``torch.jit.trace_module`` using the
    module-level ``trace_input``. The traced module's underlying
    ``_actual_script_module`` is then marked with ``export`` and given the
    same argument annotation as the eager ``forward`` before being returned.
    """
    traced = torch.jit.trace_module(BasicBertSequenceClassification(),
                                    trace_input)
    recursive_script_module = traced._actual_script_module
    # The decorators on the eager class are re-applied here, on the traced
    # module's own ``forward``.
    export(recursive_script_module.forward)
    annotate_args([
        None,
        ([-1, -1], torch.int64, True),
    ])(recursive_script_module.forward)
    return recursive_script_module
@register_test_case(module_factory=getTracedRecursiveScriptModule)
def BasicBertSequenceClassification_basic(module, tu: TestUtils):
    """Run the traced BERT classifier once on the module-level ``test_input``."""
    module.forward(test_input)
--- a/build_tools/torchscript_e2e_heavydep_tests/generate_serialized_tests.sh
+++ b/build_tools/torchscript_e2e_heavydep_tests/generate_serialized_tests.sh
@ -20,6 +20,9 @@ mkdir -p $venv_dir
 # Create the output directory and a fresh virtualenv, then activate it.
 # Expansions are quoted so paths containing spaces or glob characters are
 # passed through as a single word.
 mkdir -p "$serialized_test_dir"
 python3 -m venv "$venv_dir"
 source "$venv_dir/bin/activate"
 # For bert_seq_classification
 python3 -m pip install transformers
 # For basic_mt
 python3 -m pip install fairseq fvcore sacremoses subword-nmt
 cd "$torch_mlir_src_root"
--- a/build_tools/torchscript_e2e_heavydep_tests/main.py
+++ b/build_tools/torchscript_e2e_heavydep_tests/main.py
@ -13,6 +13,7 @@ from torch_mlir_e2e_test.torchscript.framework import SerializableTest, generate
 from torch_mlir_e2e_test.torchscript.annotations import extract_serializable_annotations
 from . import basic_mt
 from . import bert_seq_classification
 def _get_argparse():
--- a/include/torch-mlir/Dialect/Torch/IR/TorchOps.td
+++ b/include/torch-mlir/Dialect/Torch/IR/TorchOps.td
@ -563,6 +563,22 @@ def Torch_ConstantStrOp : Torch_Op<"constant.str",
  let hasFolder = 1;
 }
 // `torch.constant.device`: produces a value of Torch_DeviceType from a string
 // attribute. The op is declared NoSideEffect and implements the
 // OpAsmOpInterface `getAsmResultNames` hook to name its result.
 // NOTE(review): unlike constant.int below, this op is not marked ConstantLike
 // -- confirm whether that is intentional.
 def Torch_ConstantDeviceOp : Torch_Op<"constant.device",
    [NoSideEffect,
    DeclareOpInterfaceMethods<OpAsmOpInterface, ["getAsmResultNames"]>]> {
  let summary = "Materialize a constant Device value.";
  // The long-form description is currently empty.
  let description = [{
  }];
  // The device is carried as a plain string attribute named `value`.
  let arguments = (ins
    StrAttr:$value
  );
  let results = (outs
    Torch_DeviceType:$result
  );
  // Custom assembly: the string attribute followed by the attribute dictionary.
  let assemblyFormat = "$value attr-dict";
 }
 def Torch_ConstantIntOp : Torch_Op<"constant.int",
    [ConstantLike, NoSideEffect,
    DeclareOpInterfaceMethods<OpAsmOpInterface, ["getAsmResultNames"]>]> {
--- a/lib/Dialect/Torch/IR/TorchOps.cpp
+++ b/lib/Dialect/Torch/IR/TorchOps.cpp
@ -738,6 +738,15 @@ void ConstantStrOp::getAsmResultNames(
  setNameFn(getResult(), "str");
 }
 //===----------------------------------------------------------------------===//
 // ConstantDeviceOp
 //===----------------------------------------------------------------------===//
 void ConstantDeviceOp::getAsmResultNames(
    function_ref<void(Value, StringRef)> setNameFn) {
  // Suggest the op's `value` string attribute as the name of the result.
  StringRef deviceName = value();
  setNameFn(getResult(), deviceName);
 }
 //===----------------------------------------------------------------------===//
 // ConstantIntOp
 //===----------------------------------------------------------------------===//
--- a/python/torch_mlir/dialects/torch/importer/jit_ir/csrc/node_importer.cpp
+++ b/python/torch_mlir/dialects/torch/importer/jit_ir/csrc/node_importer.cpp
@ -156,6 +156,19 @@ void NodeImporter::importNode(Node *node, MlirBlock appendToBlock) {
          toMlirNamedAttribute(
              "value", mlirStringAttrGet(context, toMlirStringRef(node->s(
                                                      c10::attr::value)))));
    } else if (output->type()->cast<c10::TensorType>()) {
      MlirAttribute attr = importAttribute(loc, node, c10::attr::value);
      op = createMlirOperation(
          "torch.tensor.literal", loc,
          torchMlirTorchNonValueTensorTypeGetFromAttribute(attr),
          toMlirNamedAttribute("value", attr));
    } else if (output->type()->cast<c10::DeviceObjType>()) {
      op = createMlirOperation(
          "torch.constant.device", loc,
          getMlirTypeFromTorchType(loc, output->type()),
          toMlirNamedAttribute(
              "value", mlirStringAttrGet(context, toMlirStringRef(node->s(
                                                      c10::attr::value)))));
    } else if (auto functionType = output->type()->cast<c10::FunctionType>()) {
      torch::jit::Function *function = functionType->function();
      const std::string &symName = function->qualname().qualifiedName();