Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions docs/changelog/141262.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
pr: 141262
summary: Fix injected attributes' IDs in `UnionAll` branches
area: ES|QL
type: bug
issues: []
Original file line number Diff line number Diff line change
Expand Up @@ -58,6 +58,20 @@ avg_worked_seconds:long|birth_date:date|emp_no:integer|first_name:keyword|gender
268728049 |1953-09-02T00:00:00.000Z|10001 |Georgi |M |2.03 |2.0299999713897705|2.029296875 |2.03 |1986-06-26T00:00:00.000Z|[false, true] |[Accountant, Senior Python Developer]|2 |2 |2 |2 |Facello |57305 |1.19 |1 |1.19 |1 |true |null |null
;

keepFieldStarEval
required_capability: optional_fields_nullify_tech_preview

SET unmapped_fields="nullify"\;
FROM employees
| KEEP emp_no, *
| EVAL foo = does_not_exist_field + 1
| SORT emp_no
| LIMIT 1
;

emp_no:integer|avg_worked_seconds:long|birth_date:date |first_name:keyword|gender:keyword|height:double|height.float:double|height.half_float:double|height.scaled_float:double|hire_date:date |is_rehired:boolean|job_positions:keyword |languages:integer|languages.byte:integer|languages.long:long|languages.short:integer|last_name:keyword|salary:integer|salary_change:double|salary_change.int:integer|salary_change.keyword:keyword|salary_change.long:long|still_hired:boolean|does_not_exist_field:null|foo:integer
10001 |268728049 |1953-09-02T00:00:00.000Z|Georgi |M |2.03 |2.0299999713897705 |2.029296875 |2.03 |1986-06-26T00:00:00.000Z|[false, true] |[Accountant, Senior Python Developer]|2 |2 |2 |2 |Facello |57305 |1.19 |1 |1.19 |1 |true |null |null
;

dropPatternSimpleKeep
required_capability: optional_fields_nullify_tech_preview
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -181,6 +181,7 @@
import static java.util.Collections.singletonList;
import static org.elasticsearch.xpack.core.enrich.EnrichPolicy.GEO_MATCH_TYPE;
import static org.elasticsearch.xpack.esql.capabilities.TranslationAware.translatable;
import static org.elasticsearch.xpack.esql.core.expression.Expressions.toReferenceAttributes;
import static org.elasticsearch.xpack.esql.core.type.DataType.AGGREGATE_METRIC_DOUBLE;
import static org.elasticsearch.xpack.esql.core.type.DataType.BOOLEAN;
import static org.elasticsearch.xpack.esql.core.type.DataType.DATETIME;
Expand Down Expand Up @@ -1025,17 +1026,7 @@ private LogicalPlan resolveFork(Fork fork) {
return fork;
}

List<Attribute> newOutput = new ArrayList<>();

// We don't want to keep the same attributes that are outputted by the FORK branches.
// Keeping the same attributes can have unintended side effects when applying optimizations like constant folding.
for (Attribute attr : outputUnion) {
newOutput.add(
new ReferenceAttribute(attr.source(), null, attr.name(), attr.dataType(), Nullability.FALSE, null, attr.synthetic())
);
}

return fork.replaceSubPlansAndOutput(newSubPlans, newOutput);
return fork.replaceSubPlansAndOutput(newSubPlans, toReferenceAttributes(outputUnion));
}

private LogicalPlan resolveRerank(Rerank rerank, List<Attribute> childrenOutput, AnalyzerContext context) {
Expand Down Expand Up @@ -2741,16 +2732,18 @@ private static LogicalPlan maybePushDownConvertFunctions(
List<Attribute> newChildOutput = new ArrayList<>(childOutput.size());
for (Attribute oldAttr : childOutput) {
newChildOutput.add(oldAttr);
if (oldOutputToConvertFunctions.containsKey(oldAttr.name())) {
Set<AbstractConvertFunction> converts = oldOutputToConvertFunctions.get(oldAttr.name());
Set<AbstractConvertFunction> converts = oldOutputToConvertFunctions.get(oldAttr.name());
if (converts != null) {
Comment on lines +2735 to +2736
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why not the contains and .get approach? I see the code that reaches this part is fairly safe to assume that there won't be any null sets returned for a key, but we are not sure how this code will evolve in the future.

Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This isn't strictly related, but I thought I might need an update of this code and spotted the pattern.
There's nothing wrong from the functional PoV, but the code, as it was, checks if the key is in the map, then does it again, but fetching the corresponding value. The code as is in the proposed change only does the latter. If the result/value is null, the key isn't in there. (Well, I guess it could [have] be[en] a null value, to be exact, but that would have resulted in a NPE by now(?))

// create a new alias for each conversion function and add it to the new aliases list
for (AbstractConvertFunction convert : converts) {
// create a new alias for the conversion function
String newAliasName = Attribute.rawTemporaryName(oldAttr.name(), "converted_to", convert.dataType().typeName());
Alias newAlias = new Alias(
oldAttr.source(),
newAliasName, // oldAttrName$$converted_to$$targetType
convert.replaceChildren(Collections.singletonList(oldAttr))
convert.replaceChildren(Collections.singletonList(oldAttr)),
null, // generate a new id
true // this'll be used to Project the synthetic attributes out when finishing analysis
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

👍

);
newAliases.add(newAlias);
newChildOutput.add(newAlias.toAttribute());
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@
import org.elasticsearch.xpack.esql.core.expression.FieldAttribute;
import org.elasticsearch.xpack.esql.core.expression.Literal;
import org.elasticsearch.xpack.esql.core.expression.NameId;
import org.elasticsearch.xpack.esql.core.expression.NamedExpression;
import org.elasticsearch.xpack.esql.core.expression.UnresolvedAttribute;
import org.elasticsearch.xpack.esql.core.expression.UnresolvedPattern;
import org.elasticsearch.xpack.esql.core.expression.UnresolvedTimestamp;
Expand All @@ -28,7 +29,6 @@
import org.elasticsearch.xpack.esql.plan.logical.Eval;
import org.elasticsearch.xpack.esql.plan.logical.Fork;
import org.elasticsearch.xpack.esql.plan.logical.LeafPlan;
import org.elasticsearch.xpack.esql.plan.logical.Limit;
import org.elasticsearch.xpack.esql.plan.logical.LogicalPlan;
import org.elasticsearch.xpack.esql.plan.logical.Project;
import org.elasticsearch.xpack.esql.plan.logical.Row;
Expand All @@ -44,6 +44,7 @@

import static org.elasticsearch.xpack.esql.analysis.Analyzer.ResolveRefs.insistKeyword;
import static org.elasticsearch.xpack.esql.core.util.CollectionUtils.combine;
import static org.elasticsearch.xpack.esql.expression.NamedExpressions.mergeOutputAttributes;

/**
* The rule handles fields that don't show up in the index mapping, but are used within the query. These fields can either be missing
Expand Down Expand Up @@ -81,8 +82,9 @@ private static LogicalPlan resolve(LogicalPlan plan, boolean load) {
if (unresolved.isEmpty()) {
return plan;
}
var unresolvedLinkedSet = unresolvedLinkedSet(unresolved);

var transformed = load ? load(plan, unresolved) : nullify(plan, unresolved);
var transformed = load ? load(plan, unresolvedLinkedSet) : nullify(plan, unresolvedLinkedSet);
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

If the unresolveds being in a linked (thus order-preserving) set is important, should the signature of load and nullify require a LinkedHashSet rather than a Set? We shouldn't be implicitly relying on a linked set if the compiler can guarantee this for us.


return transformed.equals(plan) ? plan : refreshPlan(transformed, unresolved);
}
Expand All @@ -91,21 +93,17 @@ private static LogicalPlan resolve(LogicalPlan plan, boolean load) {
* The method introduces {@code EVAL missing_field = NULL}-equivalent into the plan, on top of the source, for every attribute in
* {@code unresolved}. It also "patches" the introduced attributes through the plan, where needed (like through Fork/UnionAll).
*/
private static LogicalPlan nullify(LogicalPlan plan, List<UnresolvedAttribute> unresolved) {
var nullAliases = nullAliases(unresolved);

private static LogicalPlan nullify(LogicalPlan plan, Set<UnresolvedAttribute> unresolved) {
// insert an Eval on top of every LeafPlan, if there's a UnaryPlan atop it
var transformed = plan.transformUp(
n -> n instanceof UnaryPlan unary && unary.child() instanceof LeafPlan,
p -> evalUnresolvedUnary((UnaryPlan) p, nullAliases)
p -> evalUnresolvedAtopUnary((UnaryPlan) p, nullAliases(unresolved))
);
// insert an Eval on top of those LeafPlan that are children of n-ary plans (could happen with UnionAll)
transformed = transformed.transformUp(
return transformed.transformUp(
n -> n instanceof UnaryPlan == false && n instanceof LeafPlan == false,
nAry -> evalUnresolvedNary(nAry, nullAliases)
nAry -> evalUnresolvedAtopNary(nAry, nullAliases(unresolved))
);

return transformed.transformUp(Fork.class, f -> patchFork(f, Expressions.asAttributes(nullAliases)));
}

/**
Expand All @@ -115,95 +113,73 @@ private static LogicalPlan nullify(LogicalPlan plan, List<UnresolvedAttribute> u
* <p>
* It also "patches" the introduced attributes through the plan, where needed (like through Fork/UnionAll).
*/
private static LogicalPlan load(LogicalPlan plan, List<UnresolvedAttribute> unresolved) {
private static LogicalPlan load(LogicalPlan plan, Set<UnresolvedAttribute> unresolved) {
// TODO: this will need to be revisited for non-lookup joining or scenarios where we won't want extraction from specific sources
var transformed = plan.transformUp(EsRelation.class, esr -> {
return plan.transformUp(EsRelation.class, esr -> {
if (esr.indexMode() == IndexMode.LOOKUP) {
return esr;
}
List<FieldAttribute> fieldsToLoad = fieldsToLoad(unresolved, esr.outputSet().names());
List<FieldAttribute> fieldsToLoad = fieldsToLoad(unresolved, Expressions.names(esr.output()));
// there shouldn't be any duplicates, we can just merge the two lists
return fieldsToLoad.isEmpty() ? esr : esr.withAttributes(combine(esr.output(), fieldsToLoad));
});

return transformed.transformUp(Fork.class, f -> patchFork(f, Expressions.asAttributes(fieldsToLoad(unresolved, Set.of()))));
}

private static List<FieldAttribute> fieldsToLoad(List<UnresolvedAttribute> unresolved, Set<String> exclude) {
private static List<FieldAttribute> fieldsToLoad(Set<UnresolvedAttribute> unresolved, List<String> exclude) {
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Isn't this a mistake? I would have expected the List to be the iteratee, and the Set to be the one we check contains on, but it seems to be the other way around.

Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It's a Set because the initial collection of UnresolvedAttributes is dedup'd -- this is what unresolvedLinkedSet() produces (// Some plans may reference the same UA multiple times (Aggregate groupings in aggregates, Eval): dedupe)
It's a List because that's what `EsRelation#output` (and then `Expressions#names`) produces.

What we want here is to exclude those attributes produced by the EsRelation itself, into which we would then later inject/insist the extractors.

Not sure if it's worth instantiating new collection types to wrap the existing ones.

List<FieldAttribute> insisted = new ArrayList<>(unresolved.size());
Set<String> names = new LinkedHashSet<>(unresolved.size());
for (var ua : unresolved) {
// some plans may reference the same UA multiple times (Aggregate groupings in aggregates, Eval)
if (names.contains(ua.name()) == false && exclude.contains(ua.name()) == false) {
if (exclude.contains(ua.name()) == false) {
insisted.add(insistKeyword(ua));
names.add(ua.name());
}
}
return insisted;
}

// TODO: would an alternative to this be to drop the current Fork and have ResolveRefs#resolveFork re-resolve it. We might need
// some plan delimiters/markers to make it unequivocal which nodes belong to "make Fork work" - like (Limit-Project[-Eval])s - and
// which don't.
private static Fork patchFork(Fork fork, List<Attribute> aliasAttributes) {
// if no child outputs the attribute, don't patch it through at all.
aliasAttributes.removeIf(a -> fork.children().stream().anyMatch(f -> descendantOutputsAttribute(f, a)) == false);
if (aliasAttributes.isEmpty()) {
return fork;
}

// TODO: would an alternative to this be to have ResolveRefs#resolveFork re-resolve the Fork?
// We might need some plan delimiters/markers to make it unequivocal which nodes belong to
// "make Fork work" - like ([Limit -] Project [- Eval])s - and which don't.
// PruneColumns does the same dance. There's some fragility w.r.t. assuming there to be a top Project and danger of the outputs not
// being aligned after applying the changes.
/**
* Update the Fork's top Projects in the subplans, and correspondingly, its output, to account for newly introduced aliases.
*/
private static Fork patchFork(Fork fork) {
List<LogicalPlan> newChildren = new ArrayList<>(fork.children().size());
boolean childrenChanged = false;
for (var child : fork.children()) {
Holder<Boolean> patched = new Holder<>(false);
child = child.transformDown(
var transformed = child.transformDown(
// TODO add a suitable forEachDownMayReturnEarly equivalent
n -> patched.get() == false && n instanceof Project, // process top Project only (Fork-injected)
n -> {
patched.set(true);
return patchForkProject((Project) n, aliasAttributes);
return patchForkProject((Project) n);
}
);
if (patched.get() == false) { // assert
throw new EsqlIllegalArgumentException("Fork child misses a top projection");
}
newChildren.add(child);
}

return fork.replaceSubPlansAndOutput(newChildren, combine(fork.output(), aliasAttributes));
}

private static Project patchForkProject(Project project, List<Attribute> aliasAttributes) {
// refresh the IDs for each UnionAll child (needed for correct resolution of convert functions; see collectConvertFunctions())
aliasAttributes = aliasAttributes.stream().map(a -> a.withId(new NameId())).toList();

project = project.withProjections(combine(project.projections(), aliasAttributes));

// If Project's child doesn't output the attribute, introduce a null-Eval'ing. This is similar to what Fork-resolution does.
List<Alias> nullAliases = new ArrayList<>(aliasAttributes.size());
for (var attribute : aliasAttributes) {
if (descendantOutputsAttribute(project, attribute) == false) {
nullAliases.add(nullAlias(attribute));
}
childrenChanged |= transformed != child;
newChildren.add(transformed);
}
return nullAliases.isEmpty() ? project : project.replaceChild(new Eval(project.source(), project.child(), nullAliases));
return childrenChanged ? fork.withSubPlans(newChildren) : fork;
}

/**
* Fork injects a {@code Limit - Project (- Eval)} top structure into its subtrees. Skip the top Limit (if present) and Project in
* the {@code plan} and look at the output of the remaining fragment.
* @return {@code true} if this fragment's output contains the {@code attribute}.
* Add any missing attributes that are found in the child's output but not in the Project's output. These have been injected before
* by the evalUnresolvedAtopXXX methods and need to be "let through" the Project.
*/
private static boolean descendantOutputsAttribute(LogicalPlan plan, Attribute attribute) {
plan = plan instanceof Limit limit ? limit.child() : plan;
if (plan instanceof Project project) {
return project.child().outputSet().names().contains(attribute.name());
private static Project patchForkProject(Project project) {
var projectOutput = project.output();
var childOutput = project.child().output();
if (projectOutput.equals(childOutput) == false) {
Comment on lines +170 to +172
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

  1. for a reviewer would have been easier to assess if this equals could be tricky or not by seeing the actual type of the .output(). In IDE this type is List.
  2. is there a scenario where this equals is missed because the same elements exists in both lists but in different order?

Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

  1. I've updated the declarations.
  2. There could be, yes. But in this case the delta list in the branch will be empty. The project will still be recreated, but the resulting instance will be equal to the previous one and the operation will eventually either leave the plan unchanged or changed, but due to other modifications. In any case, there should be a guard against that empty delta list, to avoid creating a new, unnecessary instance equal to the previous one -- thanks.

Since these changes aren't functionally impacting, I'd apply them to a follow-up PR (unless other changes will be required), if ok with you?

Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

That's ok. Thanks.

List<Attribute> delta = new ArrayList<>(childOutput);
delta.removeAll(projectOutput);
project = project.withProjections(mergeOutputAttributes(delta, projectOutput));
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Could we please avoid this pattern of renaming the input parameter and then returning it outside the block? Just use an early exit above.

Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is a pre-existing pattern. Some folks find it easier to read code with fewer returns. (Myself, I don't necessarily, but I don't mind this style either).

returning it outside the block

...reason being: if the control hasn't visited the block, the input is simply returned with no change.

Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I personally find it unfathomable that it's harder to read code with more early exits than it is to read code with more changes if the input variable, but to each their own I guess 🥲.

}
throw new EsqlIllegalArgumentException("unexpected node type [{}]", plan); // assert
return project;
}

private static LogicalPlan refreshPlan(LogicalPlan plan, List<UnresolvedAttribute> unresolved) {
var refreshed = refreshUnresolved(plan, unresolved);
return refreshChildren(refreshed);
return refreshed.transformDown(Fork.class, ResolveUnmapped::patchFork);
}

/**
Expand All @@ -222,25 +198,10 @@ private static LogicalPlan refreshUnresolved(LogicalPlan plan, List<UnresolvedAt
});
}

/**
* @return A plan having all nodes recreated (no properties changed, otherwise). This is needed to clear internal, lazy-eval'd and
* cached state, such as the output. The rule inserts new attributes in the plan, so the output of all the nodes downstream these
* insertions need be recomputed.
*/
private static LogicalPlan refreshChildren(LogicalPlan plan) {
var planChildren = plan.children();
if (planChildren.isEmpty()) {
return plan;
}
List<LogicalPlan> newChildren = new ArrayList<>(planChildren.size());
planChildren.forEach(child -> newChildren.add(refreshChildren(child)));
return plan.replaceChildren(newChildren);
}

/**
* Inserts an Eval atop each child of the given {@code nAry}, if the child is a LeafPlan.
*/
private static LogicalPlan evalUnresolvedNary(LogicalPlan nAry, List<Alias> nullAliases) {
private static LogicalPlan evalUnresolvedAtopNary(LogicalPlan nAry, List<Alias> nullAliases) {
List<LogicalPlan> newChildren = new ArrayList<>(nAry.children().size());
boolean changed = false;
for (var child : nAry.children()) {
Expand All @@ -257,7 +218,7 @@ private static LogicalPlan evalUnresolvedNary(LogicalPlan nAry, List<Alias> null
/**
* Inserts an Eval atop the given {@code unaryAtopSource}, if this isn't an Eval already. Otherwise it merges the nullAliases into it.
*/
private static LogicalPlan evalUnresolvedUnary(UnaryPlan unaryAtopSource, List<Alias> nullAliases) {
private static LogicalPlan evalUnresolvedAtopUnary(UnaryPlan unaryAtopSource, List<Alias> nullAliases) {
assertSourceType(unaryAtopSource.child());
if (unaryAtopSource instanceof Eval eval && eval.resolved()) { // if this Eval isn't resolved, insert a new (resolved) one
List<Alias> pre = new ArrayList<>(nullAliases.size());
Expand Down Expand Up @@ -291,16 +252,23 @@ private static void assertSourceType(LogicalPlan source) {
}
}

private static List<Alias> nullAliases(List<UnresolvedAttribute> unresolved) {
Map<String, Alias> aliasesMap = new LinkedHashMap<>(unresolved.size());
unresolved.forEach(u -> aliasesMap.computeIfAbsent(u.name(), k -> nullAlias(u)));
return new ArrayList<>(aliasesMap.values());
private static List<Alias> nullAliases(Set<UnresolvedAttribute> unresolved) {
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Same here: If the output list is supposed to be stable, I think we should explicitly require a LinkedHashSet.

List<Alias> aliases = new ArrayList<>(unresolved.size());
Copy link
Copy Markdown
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Why not use addAll (Or even just a basic map for that matter)?

Copy link
Copy Markdown
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Not sure I understand how would addAll help. A map could, but I find the streams too heavy for a relatively simple iteration. But let me know if I misunderstood your suggestion.

unresolved.forEach(u -> aliases.add(nullAlias(u)));
return aliases;
}

private static Alias nullAlias(Attribute attribute) {
private static Alias nullAlias(NamedExpression attribute) {
return new Alias(attribute.source(), attribute.name(), NULLIFIED);
}

// Some plans may reference the same UA multiple times (Aggregate groupings in aggregates, Eval): dedupe
private static LinkedHashSet<UnresolvedAttribute> unresolvedLinkedSet(List<UnresolvedAttribute> unresolved) {
Map<String, UnresolvedAttribute> aliasesMap = new LinkedHashMap<>(unresolved.size());
unresolved.forEach(u -> aliasesMap.putIfAbsent(u.name(), u));
return new LinkedHashSet<>(aliasesMap.values());
}

/**
* @return all the {@link UnresolvedAttribute}s in the given node / {@code plan}, but excluding the {@link UnresolvedPattern} and
* {@link UnresolvedTimestamp} subtypes.
Expand Down
Loading