Fix parse_cte.c's failure to examine sub-WITHs in DML statements.
authorTom Lane <[email protected]>
Sat, 5 Apr 2025 19:01:33 +0000 (15:01 -0400)
committerTom Lane <[email protected]>
Sat, 5 Apr 2025 19:01:33 +0000 (15:01 -0400)
makeDependencyGraphWalker thought that only SelectStmt nodes could
contain a WithClause.  Which was true in our original implementation
of WITH, but astonishingly we missed updating this code when we added
the ability to attach WITH to INSERT/UPDATE/DELETE (and later MERGE).
Moreover, since it was coded to deliberately block recursion to a
WithClause, even updating raw_expression_tree_walker didn't save it.

The upshot of this was that we didn't see references to outer CTE
names appearing within an inner WITH, and would neither complain about
disallowed recursion nor account for such references when sorting CTEs
into a usable order.  The lack of complaints about this is perhaps not
so surprising, because typical usage of WITH wouldn't hit either case.
Still, it's pretty broken; failing to detect recursion here leads to
assert failures or worse later on.

Fix by factoring out the processing of sub-WITHs into a new function
WalkInnerWith, and invoking that for all the statement types that
can have WITH.

Bug: #18878
Reported-by: Yu Liang <[email protected]>
Author: Tom Lane <[email protected]>
Discussion: https://postgr.es/m/18878-a26fa5ab6be2f2cf@postgresql.org
Backpatch-through: 13

src/backend/parser/parse_cte.c
src/test/regress/expected/with.out
src/test/regress/sql/with.sql

index d7ccb65d64735fdf93af81293c196f0b89012641..738c1c8652ee6d54e25987e3ebb1c42c28f3379f 100644 (file)
@@ -88,6 +88,7 @@ static void analyzeCTE(ParseState *pstate, CommonTableExpr *cte);
 /* Dependency processing functions */
 static void makeDependencyGraph(CteState *cstate);
 static bool makeDependencyGraphWalker(Node *node, CteState *cstate);
+static void WalkInnerWith(Node *stmt, WithClause *withClause, CteState *cstate);
 static void TopologicalSort(ParseState *pstate, CteItem *items, int numitems);
 
 /* Recursion validity checker functions */
@@ -731,58 +732,69 @@ makeDependencyGraphWalker(Node *node, CteState *cstate)
    if (IsA(node, SelectStmt))
    {
        SelectStmt *stmt = (SelectStmt *) node;
-       ListCell   *lc;
 
        if (stmt->withClause)
        {
-           if (stmt->withClause->recursive)
-           {
-               /*
-                * In the RECURSIVE case, all query names of the WITH are
-                * visible to all WITH items as well as the main query. So
-                * push them all on, process, pop them all off.
-                */
-               cstate->innerwiths = lcons(stmt->withClause->ctes,
-                                          cstate->innerwiths);
-               foreach(lc, stmt->withClause->ctes)
-               {
-                   CommonTableExpr *cte = (CommonTableExpr *) lfirst(lc);
+           /* Examine the WITH clause and the SelectStmt */
+           WalkInnerWith(node, stmt->withClause, cstate);
+           /* We're done examining the SelectStmt */
+           return false;
+       }
+       /* if no WITH clause, just fall through for normal processing */
+   }
+   else if (IsA(node, InsertStmt))
+   {
+       InsertStmt *stmt = (InsertStmt *) node;
 
-                   (void) makeDependencyGraphWalker(cte->ctequery, cstate);
-               }
-               (void) raw_expression_tree_walker(node,
-                                                 makeDependencyGraphWalker,
-                                                 (void *) cstate);
-               cstate->innerwiths = list_delete_first(cstate->innerwiths);
-           }
-           else
-           {
-               /*
-                * In the non-RECURSIVE case, query names are visible to the
-                * WITH items after them and to the main query.
-                */
-               cstate->innerwiths = lcons(NIL, cstate->innerwiths);
-               foreach(lc, stmt->withClause->ctes)
-               {
-                   CommonTableExpr *cte = (CommonTableExpr *) lfirst(lc);
-                   ListCell   *cell1;
+       if (stmt->withClause)
+       {
+           /* Examine the WITH clause and the InsertStmt */
+           WalkInnerWith(node, stmt->withClause, cstate);
+           /* We're done examining the InsertStmt */
+           return false;
+       }
+       /* if no WITH clause, just fall through for normal processing */
+   }
+   else if (IsA(node, DeleteStmt))
+   {
+       DeleteStmt *stmt = (DeleteStmt *) node;
 
-                   (void) makeDependencyGraphWalker(cte->ctequery, cstate);
-                   /* note that recursion could mutate innerwiths list */
-                   cell1 = list_head(cstate->innerwiths);
-                   lfirst(cell1) = lappend((List *) lfirst(cell1), cte);
-               }
-               (void) raw_expression_tree_walker(node,
-                                                 makeDependencyGraphWalker,
-                                                 (void *) cstate);
-               cstate->innerwiths = list_delete_first(cstate->innerwiths);
-           }
-           /* We're done examining the SelectStmt */
+       if (stmt->withClause)
+       {
+           /* Examine the WITH clause and the DeleteStmt */
+           WalkInnerWith(node, stmt->withClause, cstate);
+           /* We're done examining the DeleteStmt */
            return false;
        }
        /* if no WITH clause, just fall through for normal processing */
    }
-   if (IsA(node, WithClause))
+   else if (IsA(node, UpdateStmt))
+   {
+       UpdateStmt *stmt = (UpdateStmt *) node;
+
+       if (stmt->withClause)
+       {
+           /* Examine the WITH clause and the UpdateStmt */
+           WalkInnerWith(node, stmt->withClause, cstate);
+           /* We're done examining the UpdateStmt */
+           return false;
+       }
+       /* if no WITH clause, just fall through for normal processing */
+   }
+   else if (IsA(node, MergeStmt))
+   {
+       MergeStmt  *stmt = (MergeStmt *) node;
+
+       if (stmt->withClause)
+       {
+           /* Examine the WITH clause and the MergeStmt */
+           WalkInnerWith(node, stmt->withClause, cstate);
+           /* We're done examining the MergeStmt */
+           return false;
+       }
+       /* if no WITH clause, just fall through for normal processing */
+   }
+   else if (IsA(node, WithClause))
    {
        /*
         * Prevent raw_expression_tree_walker from recursing directly into a
@@ -796,6 +808,60 @@ makeDependencyGraphWalker(Node *node, CteState *cstate)
                                      (void *) cstate);
 }
 
+/*
+ * makeDependencyGraphWalker's recursion into a statement having a WITH clause.
+ *
+ * This subroutine is concerned with updating the innerwiths list correctly
+ * based on the visibility rules for CTE names.
+ */
+static void
+WalkInnerWith(Node *stmt, WithClause *withClause, CteState *cstate)
+{
+   ListCell   *lc;
+
+   if (withClause->recursive)
+   {
+       /*
+        * In the RECURSIVE case, all query names of the WITH are visible to
+        * all WITH items as well as the main query.  So push them all on,
+        * process, pop them all off.
+        */
+       cstate->innerwiths = lcons(withClause->ctes, cstate->innerwiths);
+       foreach(lc, withClause->ctes)
+       {
+           CommonTableExpr *cte = (CommonTableExpr *) lfirst(lc);
+
+           (void) makeDependencyGraphWalker(cte->ctequery, cstate);
+       }
+       (void) raw_expression_tree_walker(stmt,
+                                         makeDependencyGraphWalker,
+                                         (void *) cstate);
+       cstate->innerwiths = list_delete_first(cstate->innerwiths);
+   }
+   else
+   {
+       /*
+        * In the non-RECURSIVE case, query names are visible to the WITH
+        * items after them and to the main query.
+        */
+       cstate->innerwiths = lcons(NIL, cstate->innerwiths);
+       foreach(lc, withClause->ctes)
+       {
+           CommonTableExpr *cte = (CommonTableExpr *) lfirst(lc);
+           ListCell   *cell1;
+
+           (void) makeDependencyGraphWalker(cte->ctequery, cstate);
+           /* note that recursion could mutate innerwiths list */
+           cell1 = list_head(cstate->innerwiths);
+           lfirst(cell1) = lappend((List *) lfirst(cell1), cte);
+       }
+       (void) raw_expression_tree_walker(stmt,
+                                         makeDependencyGraphWalker,
+                                         (void *) cstate);
+       cstate->innerwiths = list_delete_first(cstate->innerwiths);
+   }
+}
+
 /*
  * Sort by dependencies, using a standard topological sort operation
  */
index 204d5d7d7caf74f6a73fd641869485ec34f3dafb..a64a6a858aaa111630a910eaa5b17452c71d70d4 100644 (file)
@@ -2031,6 +2031,14 @@ WITH RECURSIVE x(n) AS (
 ERROR:  ORDER BY in a recursive query is not implemented
 LINE 3:   ORDER BY (SELECT n FROM x))
                    ^
+-- and this
+WITH RECURSIVE x(n) AS (
+  WITH sub_cte AS (SELECT * FROM x)
+  DELETE FROM graph RETURNING f)
+   SELECT * FROM x;
+ERROR:  recursive query "x" must not contain data-modifying statements
+LINE 1: WITH RECURSIVE x(n) AS (
+                       ^
 CREATE TEMPORARY TABLE y (a INTEGER);
 INSERT INTO y SELECT generate_series(1, 10);
 -- LEFT JOIN
index 86f507efb276b3c4f88498c63dd50f8092be4ced..0a7c5a1784c5967ffed52d36e8cb253cc7b25acf 100644 (file)
@@ -930,6 +930,13 @@ WITH RECURSIVE x(n) AS (
   ORDER BY (SELECT n FROM x))
    SELECT * FROM x;
 
+-- and this
+WITH RECURSIVE x(n) AS (
+  WITH sub_cte AS (SELECT * FROM x)
+  DELETE FROM graph RETURNING f)
+   SELECT * FROM x;
+
+
 CREATE TEMPORARY TABLE y (a INTEGER);
 INSERT INTO y SELECT generate_series(1, 10);