From 6920876c62525fabd591def64048e608e583f0af Mon Sep 17 00:00:00 2001
From: George S <113141689+gs-olive@users.noreply.github.com>
Date: Fri, 21 Jul 2023 12:22:55 -0700
Subject: [PATCH] fix/feat: Add Dynamo-only converter registry (#1944)

---
 py/torch_tensorrt/dynamo/__init__.py          |   6 +-
 .../dynamo/conversion/converter_utils.py      |  30 ++
 .../dynamo/conversion/trt_interpreter.py      |  17 +-
 .../dynamo/converter_registry.py              | 335 ++++++++++++++++++
 .../dynamo/lowering/_partition.py             |  32 +-
 py/torch_tensorrt/fx/converter_registry.py    |  11 +
 6 files changed, 408 insertions(+), 23 deletions(-)
 create mode 100644 py/torch_tensorrt/dynamo/conversion/converter_utils.py
 create mode 100644 py/torch_tensorrt/dynamo/converter_registry.py

diff --git a/py/torch_tensorrt/dynamo/__init__.py b/py/torch_tensorrt/dynamo/__init__.py
index 3cd3a24b59..63a3308fe2 100644
--- a/py/torch_tensorrt/dynamo/__init__.py
+++ b/py/torch_tensorrt/dynamo/__init__.py
@@ -3,5 +3,9 @@
 
 if version.parse(sanitized_torch_version()) >= version.parse("2.1.dev"):
     from ._settings import *
-    from .compile import compile
     from .aten_tracer import trace
+    from .converter_registry import (
+        DYNAMO_CONVERTERS,
+        dynamo_tensorrt_converter,
+    )
+    from .compile import compile
diff --git a/py/torch_tensorrt/dynamo/conversion/converter_utils.py b/py/torch_tensorrt/dynamo/conversion/converter_utils.py
new file mode 100644
index 0000000000..4471931e4c
--- /dev/null
+++ b/py/torch_tensorrt/dynamo/conversion/converter_utils.py
@@ -0,0 +1,30 @@
+import torch
+
+
+def dynamic_unsupported(node: torch.fx.Node) -> bool:
+    # Validate that none of the inputs to the node have Dynamic shapes
+    assert isinstance(
+        node, torch.fx.Node
+    ), "Inputs to validator functions must be FX Nodes"
+
+    # Check node value itself
+    if getattr(node.meta["val"], "_has_symbolic_sizes_strides", False):
+        return False
+
+    # Check node arguments individually
+    if any(
+        getattr(arg.meta["val"], "_has_symbolic_sizes_strides", False)
+        for arg in node.args
+        if isinstance(arg, torch.fx.Node)
+    ):
+        return False
+
+    # Check node keyword arguments individually
+    if any(
+        getattr(kwarg.meta["val"], "_has_symbolic_sizes_strides", False)
+        for kwarg in node.kwargs.values()
+        if isinstance(kwarg, torch.fx.Node)
+    ):
+        return False
+
+    return True
diff --git a/py/torch_tensorrt/dynamo/conversion/trt_interpreter.py b/py/torch_tensorrt/dynamo/conversion/trt_interpreter.py
index 18fc050637..6b72d87ff6 100644
--- a/py/torch_tensorrt/dynamo/conversion/trt_interpreter.py
+++ b/py/torch_tensorrt/dynamo/conversion/trt_interpreter.py
@@ -10,11 +10,10 @@
 import tensorrt as trt
 import torch
 import torch.fx
-from torch._ops import OpOverload
 from torch.fx.node import _get_qualified_name
 from torch.fx.passes.shape_prop import TensorMetadata
 
-from torch_tensorrt.fx import CONVERTERS
+from torch_tensorrt.dynamo import DYNAMO_CONVERTERS as CONVERTERS
 from torch_tensorrt import Input
 from torch_tensorrt.fx.observer import Observer
 from torch_tensorrt.fx.utils import (
@@ -69,6 +68,7 @@ def __init__(
         self.input_specs = input_specs
         self.input_specs_iter = 0
         self._cur_node_name: Optional[str] = None
+        self._cur_node: Optional[torch.fx.Node] = None
         self._input_names: List[str] = []
         self._output_names: List[str] = []
         self._itensor_to_tensor_meta: Dict[
@@ -82,14 +82,14 @@ def validate_conversion(self):
         missing_converter = set()
 
         for node in self.module.graph.nodes:
-            if node.op == "call_function" and not CONVERTERS.get(node.target):
+            if node.op == "call_function" and not CONVERTERS.get(node):
                 missing_converter.add(f"{node.op} {_get_qualified_name(node.target)}")
-            elif node.op == "call_method" and not CONVERTERS.get(node.target):
+            elif node.op == "call_method" and not CONVERTERS.get(node):
                 missing_converter.add(f"{node.op} torch.Tensor.{node.target}")
             elif node.op == "call_module":
                 submod = self.fetch_attr(node.target)
                 submod_type = getattr(submod, "_base_class_origin", type(submod))
-                if not CONVERTERS.get(submod_type):
+                if not CONVERTERS.get(node):
                     missing_converter.add(f"{node.op} {torch.typename(submod_type)}")
 
         return missing_converter
@@ -226,6 +226,7 @@ def run(
 
     def run_node(self, n):
         self._cur_node_name = str(n)
+        self._cur_node = n
         # add "_itensor_to_tensor_meta"
         kwargs = dict(n.kwargs)
         kwargs["_itensor_to_tensor_meta"] = self._itensor_to_tensor_meta
@@ -276,7 +277,7 @@ def call_module(self, target, args, kwargs):
         assert isinstance(target, str)
         submod = self.fetch_attr(target)
         submod_type = getattr(submod, "_base_class_origin", type(submod))
-        converter = CONVERTERS.get(submod_type)
+        converter = CONVERTERS.get(self._cur_node)
 
         if not converter:
             raise RuntimeError(
@@ -287,7 +288,7 @@ def call_module(self, target, args, kwargs):
         return converter(self.network, submod, args, kwargs, self._cur_node_name)
 
     def call_function(self, target, args, kwargs):
-        converter = CONVERTERS.get(target)
+        converter = CONVERTERS.get(self._cur_node)
         if not converter:
             raise RuntimeError(
                 f"Conversion of function {torch.typename(target)} not currently supported!"
@@ -298,7 +299,7 @@ def call_function(self, target, args, kwargs):
 
     def call_method(self, target, args, kwargs):
         assert isinstance(target, str)
-        converter = CONVERTERS.get(target)
+        converter = CONVERTERS.get(self._cur_node)
 
         if not converter:
             raise RuntimeError(
diff --git a/py/torch_tensorrt/dynamo/converter_registry.py b/py/torch_tensorrt/dynamo/converter_registry.py
new file mode 100644
index 0000000000..e29e5b8437
--- /dev/null
+++ b/py/torch_tensorrt/dynamo/converter_registry.py
@@ -0,0 +1,335 @@
+import logging
+from dataclasses import dataclass, field
+from typing import Any, Callable, Dict, Optional, Sequence, Union
+from enum import Enum, auto
+
+from torch.fx.node import Target, Node, _get_qualified_name
+from torch_tensorrt.fx.converter_registry import CONVERTERS
+
+
+logger = logging.getLogger(__name__)
+
+
+class ConverterPriority(Enum):
+    """Enum to set a converter's priority in the registry"""
+
+    STANDARD = auto()
+    HIGH = auto()
+
+
+@dataclass(frozen=True)
+class ConverterSupport:
+    """Class representing a converter implementation and support function
+
+    Args:
+        converter_implementation: Function which converts said node to a TRT equivalent
+        capability_validator: Function which takes in a Node and returns a bool indicating
+            whether that node can be supported by its companion converter. Note that
+            this function must not modify the node or its graph
+    """
+
+    converter_implementation: Callable
+    capability_validator: Callable[[Node], bool] = field(default=lambda node: True)
+
+
+# Dictionary representing Dynamo aten-only converters
+# Each converter maps to a sequence of at least one ConverterSupport object(s)
+DYNAMO_ATEN_CONVERTERS: Dict[Target, Sequence[ConverterSupport]] = {}
+
+
+def dynamo_tensorrt_converter(
+    key: Target,
+    enabled: bool = True,
+    capability_validator: Optional[Callable[[Node], bool]] = None,
+    priority: ConverterPriority = ConverterPriority.STANDARD,
+) -> Callable[[Any], Any]:
+    """Decorator for Dynamo TensorRT Converter
+
+    Registers the decorated function in the DYNAMO_ATEN_CONVERTERS registry
+
+    Args:
+        key: Node target for which the converter is implemented for
+            (for example, torch.ops.add.Tensor)
+        enabled: Whether the converter should be enabled/cached or not
+        capability_validator: Function which evaluates whether a node is valid for conversion
+            by the decorated converter. See ConverterSupport for more details.
+            Defaults to None, implying the capability_validator function is always true -
+            this means all nodes of "key" kind can be supported by this converter
+        priority: Converter's level of priority relative to other converters with the
+            same target
+    Returns:
+        The converter being decorated
+    """
+
+    def register_converter(converter):
+        """Helper function to register the converter, then return it"""
+        assert callable(converter), "Converter function must be callable"
+
+        # If no capability_validator function is specified, use the default function - always return true
+        if capability_validator is None:
+            converter_support = ConverterSupport(converter_implementation=converter)
+        else:
+            assert callable(
+                capability_validator
+            ), "Argument checking function must be callable"
+            converter_support = ConverterSupport(
+                converter_implementation=converter,
+                capability_validator=capability_validator,
+            )
+
+        # If a converter for this operator already exists, append the new converter to the list
+        # Otherwise, start a new list
+        if key in DYNAMO_ATEN_CONVERTERS:
+            # High priority converters are inserted at the front of the list,
+            # so they can be checked first by the registry
+            if priority is ConverterPriority.HIGH:
+                DYNAMO_ATEN_CONVERTERS[key].insert(0, converter_support)
+            else:
+                DYNAMO_ATEN_CONVERTERS[key].append(converter_support)
+        else:
+            DYNAMO_ATEN_CONVERTERS[key] = [converter_support]
+
+        logger.debug(
+            f"Converter for {key} added to Dynamo ATen Converter Registry with priority: {priority}"
+        )
+
+        return converter
+
+    def disable_converter(converter):
+        return converter
+
+    # Select whether to cache/enable the converter
+    if enabled:
+        return register_converter
+    else:
+        return disable_converter
+
+
+class ConverterRegistry:
+    """Registry for storing multiple converter dictionaries
+
+    Capable of storing dictionaries with the following signature:
+    Dict[Target, Union[Callable, Sequence[ConverterSupport]]]
+
+    Also able to validate converter implementations against user-provided
+    argument-checking functions
+
+    Args:
+        registries: List of dictionaries representing converter registries.
+            The order of the provided dictionaries is the order in which they
+            will be traversed. This is only significant when using non-validated
+            methods.
+    """
+
+    def __init__(
+        self,
+        registries: Sequence[Dict[Target, Union[Callable, Sequence[ConverterSupport]]]],
+        registry_names: Optional[Sequence[str]] = None,
+    ):
+        # Copy reference to each dictionary object into attribute list
+        self.registries = [registry for registry in registries]
+
+        if registry_names is not None:
+            assert len(self.registries) == len(registry_names)
+            self.registry_names = [name for name in registry_names]
+        else:
+            self.registry_names = [
+                f"Registry {i + 1}" for i in range(len(self.registries))
+            ]
+
+        self.validate_invariants()
+
+    def validate_invariants(self):
+        """Validates the invariants required of the dictionaries in the registries
+
+        Raises AssertionError if any invariants have been violated
+        """
+        # All registries must be dictionaries
+        assert all(isinstance(elt, dict) for elt in self.registries)
+
+        # Every dictionary in the registry must have one of two signatures:
+        # Dict[Target, Callable] or Dict[Target, Sequence[ConverterSupport]]
+        # Where, for the latter, the sequence must be non-empty
+        for registry in self.registries:
+            for converters in registry.values():
+                if isinstance(converters, (list, tuple)):
+                    assert (
+                        all(isinstance(c, ConverterSupport) for c in converters)
+                        and len(converters) > 0
+                    )
+                else:
+                    assert callable(converters), "Converter function must be callable"
+
+    def __getitem_without_validation__(self, key: Target):
+        """Get the first-found converter in any registry
+
+        Searches all registries in order and returns the first converter encountered
+        """
+        if isinstance(key, Node):
+            raise KeyError(
+                "Unvalidated accesses to the Converter registry can only be "
+                + "made with node targets. Try accessing the registry with node.target"
+            )
+
+        self.validate_invariants()
+
+        # Iterate over all registries and return the first converter found
+        for registry in self.registries:
+            if key in registry:
+                converters = registry[key]
+
+                if isinstance(converters, (list, tuple)):
+                    return converters[0].converter_implementation
+                else:
+                    return converters
+
+        raise KeyError(f"None of the converter registries have an entry for {key}")
+
+    def __getitem__(self, node: Node):
+        """Get the first-found validated converter in any registry
+
+        Searches all registries in order and returns the first converter
+        which passes validation on the input node
+        """
+        if not isinstance(node, Node):
+            raise KeyError(
+                "Validated accesses to the Converter registry can only be "
+                + "made with node inputs. Try accessing the registry with a node "
+                + "or use get_unvalidated to access without node validation."
+            )
+
+        self.validate_invariants()
+        key = node.target
+
+        # Iterate over all registries, validating the converter on the input node
+        # If no capability_validator function is found, assume full coverage
+        for registry in self.registries:
+            if key in registry:
+                converters = registry[key]
+
+                if isinstance(converters, (list, tuple)):
+                    for candidate in converters:
+                        if candidate.capability_validator(node):
+                            return candidate.converter_implementation
+                else:
+                    return converters
+
+        raise KeyError(
+            f"None of the converter registries have a validated entry for {key}, with node {node}"
+        )
+
+    def keys(self):
+        """Get all unique targets across all dictionaries"""
+        return self.unique_targets()
+
+    def get_unvalidated(self, key: Target, value=None):
+        """Get unvalidated converter for input target with a default return"""
+        try:
+            return self.__getitem_without_validation__(key)
+        except KeyError:
+            return value
+
+    def get(self, node: Node, value=None):
+        """Get validated converter for input node with a default return"""
+        try:
+            return self.__getitem__(node)
+        except KeyError:
+            return value
+
+    def __contains__(self, key: Union[Target, Node]):
+        """Check whether a converter for an input node or target exists"""
+        try:
+            # Attempt to access the item in the registry
+            if isinstance(key, Node):
+                self.__getitem__(key)
+            else:
+                self.__getitem_without_validation__(key)
+
+            return True
+        except KeyError:
+            return False
+
+    def get_all_converters_with_target(
+        self, key: Target, return_registry_info: bool = False
+    ):
+        """Get all converters across all registries for the target
+
+        Returns a list of all converterts having the specified target
+        """
+        self.validate_invariants()
+        converters_with_target = []
+
+        # Store count of number of registered converters per registry
+        if return_registry_info:
+            registry_data = {name: 0 for name in self.registry_names}
+
+        for index, registry in enumerate(self.registries):
+            if key in registry:
+                converters = registry[key]
+
+                if isinstance(converters, (list, tuple)):
+                    converters_with_target.extend(
+                        [c.converter_implementation for c in converters]
+                    )
+                    # Add converter count to registry name storage
+                    if return_registry_info:
+                        registry_data[self.registry_names[index]] += len(converters)
+                else:
+                    converters_with_target.append(converters)
+                    # Add converter count to registry name storage
+                    if return_registry_info:
+                        registry_data[self.registry_names[index]] += 1
+
+        if return_registry_info:
+            return converters_with_target, registry_data
+        else:
+            return converters_with_target
+
+    def __setitem__(self, key, value):
+        raise AssertionError(
+            f"Do not set registry members directly through the ConverterRegistry object. "
+            + f"Attempted to set {key}: {value} via direct assignment to ConverterRegistry."
+        )
+
+    def __delitem__(self, key):
+        raise AssertionError(
+            f"Do not delete registry members directly through the ConverterRegistry object. "
+            + f"Attempted to delete {key} via direct del on ConverterRegistry."
+        )
+
+    def __len__(self):
+        """Returns the sum of lengths of all registries stored"""
+        return sum(len(registry) for registry in self.registries)
+
+    def unique_targets(self):
+        """Returns the set of unique converter targets stored across all registries"""
+        return set.union(*[set(registry.keys()) for registry in self.registries])
+
+    def qualified_name_or_str(self, target: Target) -> str:
+        """Returns string representation of an FX Node target"""
+        if isinstance(target, str):
+            return target
+        else:
+            return _get_qualified_name(target)
+
+    def display_all_available_converters(self) -> str:
+        """Returns a string with all converters and their source, separated by newlines"""
+        available_converters = "Available converters in ATen registries with counts:\n"
+
+        for target in sorted(
+            self.unique_targets(), key=lambda target: self.qualified_name_or_str(target)
+        ):
+            _, registry_data = self.get_all_converters_with_target(
+                target, return_registry_info=True
+            )
+            available_converters += f"Node: {self.qualified_name_or_str(target)} - Registry Presence Counts: {registry_data}\n"
+
+        return available_converters
+
+
+# Initialize dynamo converter registry with the FX and Dynamo aten registries
+# Note the Dynamo registry is listed first, for precedence
+DYNAMO_CONVERTERS: ConverterRegistry = ConverterRegistry(
+    [DYNAMO_ATEN_CONVERTERS, CONVERTERS],
+    ["Dynamo ATen Converters Registry", "FX ATen Converters Registry"],
+)
diff --git a/py/torch_tensorrt/dynamo/lowering/_partition.py b/py/torch_tensorrt/dynamo/lowering/_partition.py
index c239dbc5b3..18d0b5a69d 100644
--- a/py/torch_tensorrt/dynamo/lowering/_partition.py
+++ b/py/torch_tensorrt/dynamo/lowering/_partition.py
@@ -10,7 +10,7 @@
 from torch.fx.node import _get_qualified_name
 from torch.fx.passes.operator_support import OperatorSupport
 
-from torch_tensorrt.fx.converter_registry import CONVERTERS
+from torch_tensorrt.dynamo import DYNAMO_CONVERTERS as CONVERTERS
 
 
 logger = logging.getLogger(__name__)
@@ -110,8 +110,8 @@ def __init__(self, support_dict=None, torch_executed_ops=set()):
         super().__init__(support_dict)
 
         # Initialize sets of supported/unsupported operators
-        self.supported_operators = set()
-        self.unsupported_operators = set()
+        self.supported_operators = {}
+        self.unsupported_operators = {}
         self.torch_executed_ops = torch_executed_ops
 
     def is_node_supported(
@@ -123,18 +123,21 @@ def is_node_supported(
             else node.target
         )
 
-        if (
-            node.target in CONVERTERS.keys()
-            and node_name not in self.torch_executed_ops
-        ):
+        if node in CONVERTERS and node_name not in self.torch_executed_ops:
             # If node is a proper, supported computational node, store the operator
             if not node.is_impure():
-                self.supported_operators.add(node_name)
+                if node_name not in self.supported_operators:
+                    self.supported_operators[node_name] = 1
+                else:
+                    self.supported_operators[node_name] += 1
 
             return True
         else:
             if not node.is_impure():
-                self.unsupported_operators.add(node_name)
+                if node_name not in self.unsupported_operators:
+                    self.unsupported_operators[node_name] = 1
+                else:
+                    self.unsupported_operators[node_name] += 1
 
             return False
 
@@ -146,15 +149,16 @@ def print_support_overview(self, num_trt_blocks: Optional[int] = None):
 
         # Reformat support messages for debugger to print node overview as a single string
         supported_nodes_str = "\nSupported Nodes:\n"
-        for node_name in self.supported_operators:
-            supported_nodes_str += f"- {node_name}\n"
+        for node_name, count in self.supported_operators.items():
+            supported_nodes_str += f"- {node_name} + Operator Count: {count}\n"
 
         logger.debug(supported_nodes_str)
 
-        if len(self.unsupported_operators) != 0:
+        if self.unsupported_operators:
             unsupported_nodes_str = "\nUnsupported or Excluded Nodes:\n"
-            for node_name in self.unsupported_operators:
-                unsupported_nodes_str += f"- {node_name}\n"
+            for node_name, count in self.unsupported_operators.items():
+                unsupported_nodes_str += f"- {node_name} + Operator Count: {count}\n"
+
             logger.debug(unsupported_nodes_str)
         else:
             logger.debug("\nAll Nodes Supported\n")
diff --git a/py/torch_tensorrt/fx/converter_registry.py b/py/torch_tensorrt/fx/converter_registry.py
index 0167f75f08..3189effd74 100644
--- a/py/torch_tensorrt/fx/converter_registry.py
+++ b/py/torch_tensorrt/fx/converter_registry.py
@@ -1,3 +1,4 @@
+import logging
 from typing import Any, Callable, Dict
 
 from torch.fx.node import Target
@@ -7,6 +8,9 @@
 NO_EXPLICIT_BATCH_DIM_SUPPORT = {}
 
 
+logger = logging.getLogger(__name__)
+
+
 def tensorrt_converter(
     key: Target,
     no_implicit_batch_dim: bool = False,
@@ -19,6 +23,13 @@ def register_converter(converter):
             NO_IMPLICIT_BATCH_DIM_SUPPORT[key] = converter
         if no_explicit_batch_dim:
             NO_EXPLICIT_BATCH_DIM_SUPPORT[key] = converter
+
+        logger.debug(
+            f"Converter for {key} added to FX Converter Registry "
+            + f"{'without' if no_explicit_batch_dim else 'with'} Explicit Batch Dim Support + "
+            + f"{'without' if no_implicit_batch_dim else 'with'} Implicit Batch Dim Support"
+        )
+
         return converter
 
     def disable_converter(converter):