Source code for aitemplate.compiler.transform.name_graph

#  Copyright (c) Meta Platforms, Inc. and affiliates.
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
#
"""
Graph pass to assign names to a sorted graph.
"""

import logging
import re
from typing import List

from aitemplate.compiler.base import IntImm, IntVar, IntVarTensor, JaggedIntVar, Tensor
from aitemplate.utils import graph_utils

_LOGGER = logging.getLogger(__name__)

# pylint: disable=C0103

# Make these variables global to allow repeatedly calling name_graph().
func_cnt = 0
tensor_cnt = 0
func_name_to_tensor_cnt = {}

MEMO = set()
user_provided_dim = set()


def reset_name_counters():
    global func_cnt
    global tensor_cnt
    global func_name_to_tensor_cnt
    global MEMO
    func_cnt = 0
    tensor_cnt = 0
    func_name_to_tensor_cnt = {}
    MEMO = set()


def valid_c_name(name):
    return re.sub(r"\W|^(?=\d)", "_", name)


def unique_name(name):
    name = valid_c_name(name)
    global MEMO
    if name in MEMO:
        return f"{name}_{str(len(MEMO))}"
    else:
        MEMO.add(name)
        return name


def name_graph(sorted_graph: List[Tensor]) -> None:
    """Provide each tensor and operator with a unique valid C variable name.

    Parameters
    ----------
    sorted_graph : List[Tensor]
        Input graph to be named
    """
    global func_cnt
    global tensor_cnt
    global func_name_to_tensor_cnt
    global user_provided_dim
    _LOGGER.debug(
        f"before name_graph: {func_cnt=}, {tensor_cnt=}, "
        f"{len(func_name_to_tensor_cnt)=}, {len(user_provided_dim)=}"
    )
    for node in sorted_graph:
        funcs = node.src_ops()
        if len(funcs) == 0:
            if node._attrs["name"] is None:
                tensor_name = unique_name(f"tensor_{tensor_cnt}")
                node._attrs["name"] = tensor_name
                tensor_cnt += 1
                if isinstance(node, IntVarTensor):
                    if not isinstance(node._attrs["int_var"], IntImm):
                        # TODO: emit standalone dynamic shape initialization for IntVarTensor
                        raise RuntimeError(
                            "We don't support emitting standalone IntVarTensor at this moment.\n"
                            f"Encountered {node._attrs['name']}: {node._attrs['int_var']}."
                        )
                    else:
                        node._attrs["int_var"]._attrs["name"] = tensor_name
        else:
            for func in funcs:
                if func._attrs["name"] is None:
                    func_name = "{op_kind}_{idx}".format(
                        op_kind=func._attrs["op"], idx=func_cnt
                    )
                    func_name = unique_name(func_name)
                    func._attrs["name"] = func_name
                    func._attrs["original_name"] = func_name
                    func_cnt += 1
                    func_name_to_tensor_cnt[func_name] = 0
                if node._attrs["name"] is None:
                    func_tensor_count = func_name_to_tensor_cnt[func_name]
                    node_name = unique_name(f"{func_name}_{func_tensor_count}")
                    node._attrs["name"] = node_name
                    func_name_to_tensor_cnt[func_name] = func_tensor_count + 1
                    if isinstance(node, IntVarTensor):
                        shape_name = node._attrs["int_var"]._attrs["name"]
                        if shape_name is None:
                            node._attrs["int_var"]._attrs["name"] = node_name

        tensor_name = node._attrs["name"]
        for i, dim in enumerate(node._attrs["shape"]):
            if dim._attrs["name"] is not None:
                user_provided_dim.add(dim._attrs["name"])
            if dim._attrs["name"] is None and not isinstance(dim, JaggedIntVar):
                dim_name = "{tname}_dim_{idx}".format(tname=tensor_name, idx=i)
                dim._attrs["name"] = dim_name

    for tensor in sorted_graph:
        if tensor.is_jagged():
            jagged_int_var = tensor._attrs["shape"][0]
            # JaggedIntVar's name must be the same as the name of the total_length IntVar
            # that it is based on. Due to the fact that IntVar's _attrs["name"] is accessed
            # directly throughout the code, we can't enforce this constraint by overloading
            # the name in the JaggedIntVar class. As a result, we must resort to a hack here
            # to reset the name of the JaggedIntVar to the name of the total_length after
            # the latter might have been changed (e.g., from None) by the code above.
            # TODO (T146653032): wrap _attrs["name"] (and other frequently used _attrs
            # members) in @properties and override the "name" property in the JaggedIntVar
            # to return total_length().name.
            jagged_int_var._attrs["name"] = jagged_int_var.total_length()._attrs["name"]

            batch_dim = jagged_int_var.batch_dim()
            if batch_dim._attrs["name"] is None:
                # the batch_dim wasn't named above, so we name it here
                jagged_int_var_name = jagged_int_var._attrs["name"]
                batch_dim._attrs["name"] = f"{jagged_int_var_name}_jagged_batch_dim"

    _LOGGER.debug(
        f"after name_graph: {func_cnt=}, {tensor_cnt=}, "
        f"{len(func_name_to_tensor_cnt)=}, {len(user_provided_dim)=}"
    )
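
# Illustration of the naming scheme produced by name_graph() above (the concrete
# indices are examples and depend on the global counters at call time, not
# guaranteed values): a tensor with no src_ops becomes e.g. "tensor_0"; an op
# whose op kind is e.g. "gemm_rcr" becomes "gemm_rcr_3", and its output tensors
# become "gemm_rcr_3_0", "gemm_rcr_3_1", ...; an unnamed, non-jagged dimension i
# of a tensor named "tensor_0" becomes "tensor_0_dim_i".
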
def dedup_symbolic_name(sorted_graph: List[Tensor]) -> None:
    """Rename all shape variables that are symbolically identical to the same name.

    Parameters
    ----------
    sorted_graph : List[Tensor]
        Input graph to be simplified
    """
    symbolic_to_name = {}
    global user_provided_dim

    # First pass - build symbolic_to_name map
    for i, dim in _all_dims_in_graph(sorted_graph):
        if not _dim_qualified_for_sym_dedup(dim):
            continue
        dim_sym = dim.symbolic_value()
        if (
            dim_sym not in symbolic_to_name
            or dim_sym in symbolic_to_name
            and dim._attrs["name"] in user_provided_dim
        ):
            symbolic_to_name[dim_sym] = dim._attrs["name"] or f"dim_{i}"

    # Second pass - use symbolic_to_name map
    for _, dim in _all_dims_in_graph(sorted_graph):
        if not _dim_qualified_for_sym_dedup(dim):
            continue
        dim_sym = dim.symbolic_value()
        dim._attrs["name"] = symbolic_to_name[dim_sym]
def _all_dims_in_graph(sorted_graph: List[Tensor]):
    dim_idx = 0
    for node in sorted_graph:
        for dim in node._attrs["shape"]:
            yield dim_idx, dim
            dim_idx += 1

    # In case some dimensions are not encountered in any nodes in the graph,
    # only in input/output accessors - iterate over all ops and dimensions
    # in tensor accessors, if any.
    sorted_ops = graph_utils.get_sorted_ops(sorted_graph)
    for op in sorted_ops:
        input_accessors = op._attrs.get("input_accessors", None)
        output_accessors = op._attrs.get("output_accessors", None)
        for accessors in (input_accessors, output_accessors):
            if accessors is None:
                continue
            for ta in accessors:
                if ta.original_shapes:
                    for dim in ta.original_shapes:
                        yield dim_idx, dim
                        dim_idx += 1


def _dim_qualified_for_sym_dedup(dim: IntVar) -> bool:
    return not isinstance(dim, IntImm) and not isinstance(dim, JaggedIntVar)
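

if __name__ == "__main__":
    # A minimal sketch of driving these passes by hand, assuming the simple
    # Tensor/IntVar/IntImm constructor calls below suffice to build a
    # one-tensor "graph"; in practice the sorted graph comes out of the
    # compiler's tracing and toposort passes, and the exact generated names
    # depend on the global counters.
    batch = IntVar([1, 8])  # dynamic batch dimension, initially unnamed
    x = Tensor(shape=[batch, IntImm(4)], is_input=True)

    reset_name_counters()
    name_graph([x])           # e.g. assigns "tensor_0", "tensor_0_dim_0", ...
    dedup_symbolic_name([x])  # collapses symbolically equal dims to one name

    print(x._attrs["name"], [d._attrs["name"] for d in x._attrs["shape"]])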