Skip to content

Commit bfadd0c

Browse files
committed
[executorch] Add propagate_input_spec pass and while_loop HOP support
Add a new pass named `propagate_input_spec`, which recursively assigns meta["input_spec"] on placeholder nodes, including in nested control flow submodules. Placeholders that don't correspond to a top-level input are not assigned this meta key. Also, add `while_loop` to `get_control_flow_submodules`. Differential Revision: [D95876986](https://our.internmc.facebook.com/intern/diff/D95876986/) [ghstack-poisoned]
1 parent 4601e90 commit bfadd0c

File tree

7 files changed

+423
-1
lines changed

7 files changed

+423
-1
lines changed

exir/graph_module.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -78,7 +78,7 @@ def get_control_flow_submodules(
7878
) -> List[Tuple[str, torch.fx.GraphModule, torch.fx.Node]]:
7979
"""
8080
Returns a list of submodules used for control flow operations
81-
(torch.ops.higher_order.cond/map/scan) that are in the given toplevel graph (does not look
81+
(torch.ops.higher_order.cond/map/scan/while_loop) that are in the given toplevel graph (does not look
8282
into submodules). Specifically, the returned value is a list containing
8383
tuples of (name of the submodule that's stored in the graph module, the
8484
submodule itself, and the fx node that uses this submodule).
@@ -89,6 +89,7 @@ def get_control_flow_submodules(
8989
torch.ops.higher_order.cond: [1, 2],
9090
torch.ops.higher_order.map_impl: [0],
9191
torch.ops.higher_order.scan: [0], # combine_fn is at arg index 0
92+
torch.ops.higher_order.while_loop: [0, 1],
9293
},
9394
)
9495

exir/passes/BUCK

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -407,6 +407,16 @@ fbcode_target(_kind = runtime.python_library,
407407
],
408408
)
409409

410+
# Standalone library for the propagate_input_spec pass, which assigns
# meta["input_spec"] on placeholder nodes, including inside nested
# control-flow submodules.
fbcode_target(_kind = runtime.python_library,
    name = "propagate_input_spec",
    srcs = [
        "propagate_input_spec.py",
    ],
    deps = [
        "//caffe2:torch",
    ],
)
419+
410420
fbcode_target(_kind = runtime.python_library,
411421
name = "remove_unused_parameters_pass",
412422
srcs = [
Lines changed: 151 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,151 @@
1+
# This pass exists to propagate input spec metadata down through nested
2+
# submodules. Specifically, metadata for the type of tensor - USER_INPUT, PARAM,
3+
# BUFFER, corresponding to torch.export.graph_signature.InputKind. If the tensor
4+
# is not a direct input in all paths, it's left as None.
5+
#
6+
# Metadata is stored in the node meta["input_spec"] with a type of
7+
# torch.export.graph_signature.InputSpec or None. It corresponds to the output
8+
# value of the node, and can be a tuple for nodes that return tuples.
9+
#
10+
# After this pass runs, it should be present on all nodes, including arbitrarily
11+
# nested submodules. This may become stale if the graph is mutated, though.
12+
13+
from typing import Any, Sequence
14+
15+
import torch
16+
17+
from torch.export import ExportedProgram
18+
from torch.export.graph_signature import InputSpec
19+
from torch.fx import GraphModule, Node
20+
21+
# Key under which the InputSpec (or None) is stored in node.meta.
INPUT_SPEC_KEY = "input_spec"
25+
def propagate_input_spec(ep: ExportedProgram) -> ExportedProgram:
    """
    Assign the meta["input_spec"] value for placeholders in the graph, including
    placeholder nodes in control flow submodules.

    Args:
        ep: The exported program whose graph module (and nested control-flow
            submodules) will be annotated in place.

    Returns:
        The same ``ExportedProgram`` instance, annotated in place.
    """
    # Clear any stale input_spec metadata before propagating fresh values.
    # Passes like duplicate_constant_node copy all metadata (including
    # input_spec) to new nodes, leaving stale specs that don't match the
    # updated EP signature.
    _clear_input_spec_recursive(ep.graph_module)

    # Top-level placeholders are matched to specs by argument name; nested
    # submodules are matched positionally inside the recursive helper.
    inputs = {s.arg.name: s for s in ep.graph_signature.input_specs}
    _propagate_input_spec_recursive(ep.graph_module, inputs)

    # Fix: the original fell off the end and returned None despite the
    # ``-> ExportedProgram`` annotation; return the (mutated) program so the
    # signature is honored and the call can be chained.
    return ep
40+
def _clear_input_spec_recursive(gm: GraphModule) -> None:
    """
    Remove any previously-assigned meta["input_spec"] entry from every
    placeholder node in ``gm`` and, recursively, in all of its GraphModule
    children.
    """
    placeholders = (n for n in gm.graph.nodes if n.op == "placeholder")
    for placeholder in placeholders:
        placeholder.meta.pop(INPUT_SPEC_KEY, None)

    # Descend into nested submodules; control-flow branches live here.
    for child in gm.children():
        if isinstance(child, GraphModule):
            _clear_input_spec_recursive(child)
49+
def _collect_node_arg_specs(args: Sequence[Any]) -> list[InputSpec | None]:
    """
    Look up the previously-assigned input spec for each node arg.

    Args without a ``meta`` dict (non-node values) and nodes that were never
    assigned a spec both map to None.
    """
    specs: list[InputSpec | None] = []
    for arg in args:
        if hasattr(arg, "meta"):
            specs.append(arg.meta.get(INPUT_SPEC_KEY, None))
        else:
            specs.append(None)
    return specs
58+
def _propagate_input_spec_recursive(
    gm: GraphModule, inputs: dict[str, InputSpec] | Sequence[InputSpec]
) -> None:
    """
    Given a dictionary or list of InputSpecs for graph inputs, propagate the
    specs to any nested submodules.
    """
    # Submodules don't carry graph signatures, so when given a positional
    # sequence of specs we rebuild the placeholder-name -> spec mapping from
    # placeholder node order. This relies on placeholder order matching the
    # graph inputs - an implicit contract pytorch already depends on.
    if not isinstance(inputs, dict):
        by_name: dict[str, InputSpec] = {}
        for ph in gm.graph.nodes:
            if ph.op == "placeholder":
                by_name[ph.target] = inputs[len(by_name)]
        inputs = by_name

    # Control-flow HOPs dispatch to their dedicated handlers; each recurses
    # into the relevant submodule(s).
    hop_handlers = {
        torch.ops.higher_order.cond: _update_cond_meta,
        torch.ops.higher_order.map_impl: _update_map_meta,
        torch.ops.higher_order.scan: _update_scan_meta,
        torch.ops.higher_order.while_loop: _update_while_loop_meta,
    }

    for node in gm.graph.nodes:
        if node.op == "placeholder":
            _update_placeholder_meta(node, inputs)
        else:
            handler = hop_handlers.get(node.target)
            if handler is not None:
                handler(node, inputs)
91+
def _update_placeholder_meta(node: Node, inputs: dict[str, InputSpec]) -> None:
    """
    Set or clear meta["input_spec"] on a single placeholder node, depending on
    whether a spec exists for its target name.
    """
    spec = inputs.get(node.target)
    if spec is None:
        # No top-level input corresponds to this placeholder; ensure no stale
        # spec is left behind.
        node.meta.pop(INPUT_SPEC_KEY, None)
    else:
        node.meta[INPUT_SPEC_KEY] = spec
100+
def _update_cond_meta(node: Node, inputs: dict[str, InputSpec]) -> None:
    """
    Propagate input specs into both branches of a ``cond`` HOP. The branches
    share the same operand list, so both receive identical specs.
    """
    _, true_branch_attr, false_branch_attr, branch_operands = node.args
    branch_specs = _collect_node_arg_specs(branch_operands)

    # The branch args are get_attr nodes; resolve them to the submodules they
    # name on the owning module before recursing (true branch first).
    owner = node.graph.owning_module
    branches = [
        getattr(owner, attr.target)
        for attr in (true_branch_attr, false_branch_attr)
    ]
    for branch in branches:
        _propagate_input_spec_recursive(branch, branch_specs)
113+
def _update_map_meta(node: Node, inputs: dict[str, InputSpec]) -> None:
    """
    Propagate input specs into the body submodule of a ``map_impl`` HOP. The
    body's placeholders line up with the mapped args followed by the operands.
    """
    fn_attr, mapped_args, operands = node.args
    body_specs = _collect_node_arg_specs(mapped_args) + _collect_node_arg_specs(
        operands
    )

    # Resolve the get_attr node naming the body submodule.
    body = getattr(node.graph.owning_module, fn_attr.target)
    _propagate_input_spec_recursive(body, body_specs)
126+
def _update_while_loop_meta(node: Node, inputs: dict[str, InputSpec]) -> None:
    """
    Propagate input specs into the cond_fn and body_fn submodules of a
    ``while_loop`` HOP. Both take the carried inputs followed by the
    additional inputs, so they share one spec list.
    """
    cond_attr, body_attr, carried_inputs, additional_inputs = node.args
    loop_specs = _collect_node_arg_specs(carried_inputs) + _collect_node_arg_specs(
        additional_inputs
    )

    # Resolve the get_attr nodes to the submodules they name (cond_fn first).
    owner = node.graph.owning_module
    submodules = [getattr(owner, attr.target) for attr in (cond_attr, body_attr)]
    for submodule in submodules:
        _propagate_input_spec_recursive(submodule, loop_specs)
140+
def _update_scan_meta(node: Node, inputs: dict[str, InputSpec]) -> None:
    """
    Propagate input specs into the combine_fn submodule of a ``scan`` HOP.
    Its placeholders line up with init, then xs, then the additional inputs.
    """
    combine_attr, init, xs, additional_inputs = node.args
    combine_specs = (
        _collect_node_arg_specs(init)
        + _collect_node_arg_specs(xs)
        + _collect_node_arg_specs(additional_inputs)
    )

    # Resolve the get_attr node naming the combine_fn submodule.
    combine_fn = getattr(node.graph.owning_module, combine_attr.target)
    _propagate_input_spec_recursive(combine_fn, combine_specs)

exir/program/BUCK

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -40,6 +40,7 @@ fbcode_target(_kind = runtime.python_library,
4040
"//executorch/exir/passes:insert_write_back_for_buffers_pass",
4141
"//executorch/exir/passes:lib",
4242
"//executorch/exir/passes:normalize_view_copy_base_pass",
43+
"//executorch/exir/passes:propagate_input_spec",
4344
"//executorch/exir/passes:remove_graph_asserts_pass",
4445
"//executorch/exir/passes:remove_mixed_type_operators",
4546
"//executorch/exir/passes:replace_aten_with_edge_pass",

exir/program/_program.py

Lines changed: 9 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -59,6 +59,7 @@
5959
from executorch.exir.passes.normalize_view_copy_base_pass import (
6060
NormalizeViewCopyBasePass,
6161
)
62+
from executorch.exir.passes.propagate_input_spec import propagate_input_spec
6263
from executorch.exir.passes.quant_fusion_pass import quant_fusion_and_const_prop_pass
6364
from executorch.exir.passes.reinplace import reinplace_pass
6465
from executorch.exir.passes.remove_graph_asserts_pass import (
@@ -912,6 +913,9 @@ def _generate_edge_program(
912913
],
913914
)
914915

916+
# Recursively tag placeholder nodes in submodules with input specs.
917+
propagate_input_spec(edge_program)
918+
915919
# Lift the tensor constants created in ScalarToTensorPass
916920
edge_program = lift_constant_tensor_pass(edge_program)
917921

@@ -1232,6 +1236,11 @@ def _gen_edge_manager_for_partitioners(
12321236
# First pass of decompositions with this partitioner's preserved ops
12331237
program = program.run_decompositions(table)
12341238

1239+
# Propagate input specs so that check_constraints
1240+
# can identify parameter nodes inside control flow
1241+
# submodules (e.g. cond/map/scan branches).
1242+
propagate_input_spec(program)
1243+
12351244
# Filter ops using EDGE_DO_NOT_DECOMP
12361245
temp_partitioner_dict = {name: [curr_partitioner]}
12371246
preserved_ops = (

exir/tests/__init__.py

Whitespace-only changes.

0 commit comments

Comments
 (0)