# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.

from typing import cast, Dict, List

import torch
from executorch.backends.xnnpack._passes.channels_last_tagged_reshape_pass import (
    ChannelsLastTaggedReshapePass,
)
from executorch.backends.xnnpack.operators.node_visitor import (
    NodeVisitor,
    register_node_visitor,
)
from executorch.backends.xnnpack.serialization.xnnpack_graph_schema import (
    XNNGraph,
    XNNStaticTranspose,
    XNode,
)
from executorch.backends.xnnpack.utils.utils import (
    check_or_raise,
    get_input_node,
    PERM_NCHW_TO_NHWC,
    PERM_NHWC_TO_NCHW,
)


@register_node_visitor
class PermuteVisitor(NodeVisitor):
    target = "aten.permute_copy.default"

    def __init__(self, *args) -> None:
        super().__init__(*args)

    def define_node(
        self,
        node: torch.fx.Node,
        xnn_graph: XNNGraph,
        vals_to_ids: Dict[torch.fx.Node, int],
        debug_handle: int,
    ) -> None:
        self.define_nodes_tensor_inputs_outputs(node, xnn_graph, vals_to_ids)

        # input
        input_node = get_input_node(node, 0)
        input_id = vals_to_ids[input_node]

        # output
        output_id = vals_to_ids[node]

        # permutation
        input_rank = input_node.meta["val"].dim()
        permute_order = cast(List[int], node.args[1])

        # Handle negative dimensions by converting them to positive indices
        permute_order = [
            (dim + input_rank) if dim < 0 else dim for dim in permute_order
        ]

        # change permute order if under channels last
        is_channels_last = node.meta.get(
            ChannelsLastTaggedReshapePass.XNN_NHWC_NODE, False
        )
        if is_channels_last:
            check_or_raise(
                len(permute_order) == 4,
                "Internal Error: Permute was tagged in channels last but is not 4D",
            )
            permute_order_in_contiguous = [PERM_NHWC_TO_NCHW[i] for i in permute_order]
            permute_order_in_channels_last = [
                permute_order_in_contiguous[i] for i in PERM_NCHW_TO_NHWC
            ]
            permute_order = permute_order_in_channels_last

        ser_node = XNode(
            xnode_union=XNNStaticTranspose(
                input_id=input_id,
                num_dims=len(permute_order),
                perm=permute_order,
                output_id=output_id,
                flags=0,
            ),
            debug_handle=debug_handle,
        )
        xnn_graph.xnodes.append(ser_node)
