Refine literal comprehension sugar behavior and docs

gordonwatts · gordonwatts · commit a3d91bee3de9 · 2026-02-12T23:17:25.000-06:00
diff --git a/README.md b/README.md
@@ -57,13 +57,18 @@ There are several python expressions and idioms that are translated behind your
 --- | --- | --- |
 |List Comprehension | `[j.pt() for j in jets]` | `jets.Select(lambda j: j.pt())` |
 |List Comprehension | `[j.pt() for j in jets if abs(j.eta()) < 2.4]` | `jets.Where(lambda j: abs(j.eta()) < 2.4).Select(lambda j: j.pt())` |
+|Literal List Comprehension|`[i for i in [1, 2, 3]]`|`[1, 2, 3]`|
 | Data Classes<br>(typed) | `@dataclass`<br>`class my_data:`<br>`x: ObjectStream[Jets]`<br><br>`Select(lambda e: my_data(x=e.Jets()).x)` | `Select(lambda e: {'x': e.Jets()}.x)` |
 | Named Tuple<br>(typed) | `class my_data(NamedTuple):`<br>`x: ObjectStream[Jets]`<br><br>`Select(lambda e: my_data(x=e.Jets()).x)` | `Select(lambda e: {'x': e.Jets()}.x)` |
 |List Membership|`p.absPdgId() in [35, 51]`|`p.absPdgId() == 35 or p.absPdgId() == 51`|
-| `any`/`all` | `any(e.pt()>10, abs(e.eta()) < 2.5` | `e.pt() > 10 | abs(e.eta()) < 2.5` |
+| `any`/`all` | `any([e.pt() > 10, abs(e.eta()) < 2.5])` | `e.pt() > 10 or abs(e.eta()) < 2.5` |
 
 Note: Everything that goes for a list comprehension also goes for a generator expression.
 
+For `any`/`all`, generator/list comprehensions over a list or tuple literal (or a captured
+list/tuple constant) are first expanded to a literal list and then reduced as usual. For example,
+`any(f(a) for a in [1, 2])` is treated like `any([f(1), f(2)])`.
+
 ## Extensibility
 
 There are two several extensibility points:
diff --git a/docs/source/generic/query_structure.md b/docs/source/generic/query_structure.md
@@ -34,3 +34,15 @@ This can be continued to deeper and deeper levels within the data. For example,
 
 Due to the flexible nature of FuncADL there are multiple ways to structure each query. Throughout this documentation different structures will be used for the sake of demonstration.
 
+## Syntactic Sugar
+
+Inside query lambdas, FuncADL also rewrites a few common Python forms into query-friendly
+expressions:
+
+- List/generator comprehensions over streams are lowered to `.Where(...)`/`.Select(...)`.
+- List/generator comprehensions over literal lists or tuples are expanded directly. For example,
+  `[i for i in [1, 2, 3]]` becomes `[1, 2, 3]`.
+- `any`/`all` over literal lists/tuples are reduced to boolean `or`/`and` expressions.
+
+This means patterns like `any(expr(x) for x in LITERAL_LIST)` can be simplified in-query,
+as long as the iterable is a list/tuple literal (or a captured list/tuple constant).
diff --git a/func_adl/ast/syntatic_sugar.py b/func_adl/ast/syntatic_sugar.py
@@ -2,9 +2,10 @@
 import copy
 import inspect
 from dataclasses import is_dataclass
-from typing import Any, List, Optional
+from itertools import product
+from typing import Any, Dict, List, Optional, Tuple
 
-from func_adl.util_ast import lambda_build
+from func_adl.util_ast import as_ast, lambda_build
 
 
 def resolve_syntatic_sugar(a: ast.AST) -> ast.AST:
@@ -22,6 +23,118 @@ def resolve_syntatic_sugar(a: ast.AST) -> ast.AST:
     """
 
     class syntax_transformer(ast.NodeTransformer):
+        def _extract_literal_iterable(self, node: ast.AST) -> Optional[List[ast.expr]]:
+            """Return literal iterable elements if ``node`` is a list/tuple literal."""
+
+            if isinstance(node, (ast.List, ast.Tuple)):
+                return list(node.elts)
+            if isinstance(node, ast.Constant) and isinstance(node.value, (list, tuple)):
+                return [as_ast(v) for v in node.value]
+            return None
+
+        def _target_bindings(
+            self, target: ast.AST, value: ast.AST, node: ast.AST
+        ) -> Optional[Dict[str, ast.expr]]:
+            """Build loop-variable bindings for a single comprehension iteration.
+
+            Returns ``None`` when destructuring cannot be applied for this ``value``.
+            """
+
+            if isinstance(target, ast.Name):
+                return {target.id: copy.deepcopy(value)}
+
+            if isinstance(target, (ast.Tuple, ast.List)):
+                if not isinstance(value, (ast.Tuple, ast.List)):
+                    return None
+                if len(target.elts) != len(value.elts):
+                    raise ValueError(
+                        "Comprehension unpacking length mismatch" f" - {ast.unparse(node)}"
+                    )
+
+                bindings: Dict[str, ast.expr] = {}
+                for target_elt, value_elt in zip(target.elts, value.elts):
+                    child_bindings = self._target_bindings(target_elt, value_elt, node)
+                    if child_bindings is None:
+                        return None
+                    bindings.update(child_bindings)
+                return bindings
+
+            raise ValueError(
+                f"Comprehension variable must be a name or tuple/list, but found {target}"
+                f" - {ast.unparse(node)}"
+            )
+
+        def _substitute_names(self, expr: ast.expr, bindings: Dict[str, ast.expr]) -> ast.expr:
+            class _name_replacer(ast.NodeTransformer):
+                def __init__(self, loop_bindings: Dict[str, ast.expr]):
+                    self._loop_bindings = loop_bindings
+
+                def visit_Name(self, replace_node: ast.Name) -> Any:
+                    if (
+                        isinstance(replace_node.ctx, ast.Load)
+                        and replace_node.id in self._loop_bindings
+                    ):
+                        return copy.deepcopy(self._loop_bindings[replace_node.id])
+                    return replace_node
+
+            return _name_replacer(bindings).visit(copy.deepcopy(expr))
+
+        def _inline_literal_comprehension(
+            self, lambda_body: ast.expr, generators: List[ast.comprehension], node: ast.AST
+        ) -> Optional[List[ast.expr]]:
+            """Expand comprehensions over literal iterables into literal expressions."""
+
+            literal_values: List[List[Tuple[Dict[str, ast.expr], List[ast.expr]]]] = []
+            for generator in generators:
+                if generator.is_async:
+                    raise ValueError(f"Comprehension can't be async - {ast.unparse(node)}.")
+
+                iter_values = self._extract_literal_iterable(generator.iter)
+                if iter_values is None:
+                    return None
+
+                generator_values: List[Tuple[Dict[str, ast.expr], List[ast.expr]]] = []
+                for iter_value in iter_values:
+                    bindings = self._target_bindings(generator.target, iter_value, node)
+                    if bindings is None:
+                        return None
+                    generator_values.append((bindings, generator.ifs))
+                literal_values.append(generator_values)
+
+            if len(literal_values) == 0:
+                return []
+
+            expanded: List[ast.expr] = []
+            for combo in product(*literal_values):
+                merged_bindings: Dict[str, ast.expr] = {}
+                all_ifs: List[ast.expr] = []
+                for c_bindings, c_ifs in combo:
+                    merged_bindings.update(c_bindings)
+                    all_ifs.extend(c_ifs)
+
+                include_item = True
+                for if_clause in all_ifs:
+                    rendered_if = self.visit(self._substitute_names(if_clause, merged_bindings))
+                    if not isinstance(rendered_if, ast.Constant) or not isinstance(
+                        rendered_if.value, bool
+                    ):
+                        raise ValueError(
+                            "Literal comprehension if-clause must resolve to a bool constant"
+                            f" - {ast.unparse(if_clause)}"
+                        )
+                    if not rendered_if.value:
+                        include_item = False
+                        break
+
+                if include_item:
+                    rendered_item = self.visit(
+                        self._substitute_names(lambda_body, merged_bindings)
+                    )
+                    assert isinstance(rendered_item, ast.expr)
+                    expanded.append(rendered_item)
+
+            return expanded
+
         def _resolve_any_all_call(
             self, call_node: ast.Call, source_node: ast.AST
         ) -> Optional[ast.AST]:
@@ -44,6 +157,8 @@ def _resolve_any_all_call(
                 )
 
             sequence = call_node.args[0]
+            if isinstance(sequence, (ast.ListComp, ast.GeneratorExp)):
+                return None
             if not isinstance(sequence, (ast.List, ast.Tuple)):
                 raise ValueError(
                     f"{func_name} requires a list or tuple literal argument"
@@ -77,10 +192,8 @@ def resolve_generator(
             for c in reversed(generators):
                 target = c.target
                 if not isinstance(target, ast.Name):
-                    raise ValueError(
-                        f"Comprehension variable must be a name, but found {target}"
-                        f" - {ast.unparse(node)}."
-                    )
+                    # Keep original comprehension for unsupported lowering cases.
+                    return node
                 if c.is_async:
                     raise ValueError(f"Comprehension can't be async - {ast.unparse(node)}.")
                 source_collection = c.iter
@@ -110,6 +223,10 @@ def visit_ListComp(self, node: ast.ListComp) -> Any:
             a = self.generic_visit(node)
 
             if isinstance(a, ast.ListComp):
+                if (
+                    expanded := self._inline_literal_comprehension(a.elt, a.generators, node)
+                ) is not None:
+                    return ast.List(elts=expanded, ctx=ast.Load())
                 a = self.resolve_generator(a.elt, a.generators, node)
 
             return a
@@ -119,6 +236,10 @@ def visit_GeneratorExp(self, node: ast.GeneratorExp) -> Any:
             a = self.generic_visit(node)
 
             if isinstance(a, ast.GeneratorExp):
+                if (
+                    expanded := self._inline_literal_comprehension(a.elt, a.generators, node)
+                ) is not None:
+                    return ast.List(elts=expanded, ctx=ast.Load())
                 a = self.resolve_generator(a.elt, a.generators, node)
 
             return a
diff --git a/tests/ast/test_syntatic_sugar.py b/tests/ast/test_syntatic_sugar.py
@@ -30,6 +30,13 @@ def test_resolve_generator():
     assert ast.dump(ast.parse("jets.Select(lambda j: j.pt())")) == ast.dump(a_new)
 
 
+def test_resolve_literal_list_comp():
+    a = ast.parse("[i for i in [1, 2, 3]]")
+    a_new = resolve_syntatic_sugar(a)
+
+    assert ast.dump(ast.parse("[1, 2, 3]")) == ast.dump(a_new)
+
+
 def test_resolve_listcomp_if():
     a = ast.parse("[j.pt() for j in jets if j.pt() > 100]")
     a_new = resolve_syntatic_sugar(a)
@@ -62,11 +69,11 @@ def test_resolve_2generator():
 
 def test_resolve_bad_iterator():
     a = ast.parse("[j.pt() for idx,j in enumerate(jets)]")
+    a_new = resolve_syntatic_sugar(a)
 
-    with pytest.raises(ValueError) as e:
-        resolve_syntatic_sugar(a)
-
-    assert "name" in str(e)
+    # Unsupported lowering (tuple target with non-literal source) should be
+    # preserved for downstream processing.
+    assert ast.unparse(a_new) == ast.unparse(a)
 
 
 def test_resolve_no_async():
@@ -396,3 +403,21 @@ def test_resolve_any_requires_literal_sequence():
 
     with pytest.raises(ValueError, match="list or tuple literal"):
         resolve_syntatic_sugar(a)
+
+
+def test_resolve_any_generator_from_literal_capture():
+    bib_triggers = [(1, 2), (3, 4)]
+
+    def tdt_chain_fired(chain: int) -> bool:
+        return chain > 1
+
+    a = parse_as_ast(
+        lambda e: any(
+            tdt_chain_fired(incl_trig) and not tdt_chain_fired(bib_trig)
+            for incl_trig, bib_trig in bib_triggers
+        )
+    )
+    a_resolved = resolve_syntatic_sugar(a)
+
+    a_expected = ast.parse("lambda e: (1 > 1 and not (2 > 1)) or (3 > 1 and not (4 > 1))")
+    assert ast.unparse(a_resolved) == ast.unparse(a_expected)