Fix overeager pushdown of HAVING clauses when grouping sets are used.

author Andres Freund <[email protected]>

Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)

committer Andres Freund <[email protected]>

Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)
author Andres Freund <[email protected]>
Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)
committer Andres Freund <[email protected]>
Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)
diff --git a/src/backend/optimizer/plan/planner.c b/src/backend/optimizer/plan/planner.c

index a3cc27464c10c39b02df64a13ca2d54e1359d565..4f8e4c07d615a1dadf8e1f85380fdbf333d3d7b1 100644 (file)
--- a/src/backend/optimizer/plan/planner.c
+++ b/src/backend/optimizer/plan/planner.c
@@ -653,13 +653,19 @@ subquery_planner(PlannerGlobal *glob, Query *parse,
      * In some cases we may want to transfer a HAVING clause into WHERE. We
      * cannot do so if the HAVING clause contains aggregates (obviously) or
      * volatile functions (since a HAVING clause is supposed to be executed
-    * only once per group).  Also, it may be that the clause is so expensive
-    * to execute that we're better off doing it only once per group, despite
-    * the loss of selectivity.  This is hard to estimate short of doing the
-    * entire planning process twice, so we use a heuristic: clauses
-    * containing subplans are left in HAVING.  Otherwise, we move or copy the
-    * HAVING clause into WHERE, in hopes of eliminating tuples before
-    * aggregation instead of after.
+    * only once per group).  We also can't do this if there are any nonempty
+    * grouping sets; moving such a clause into WHERE would potentially change
+    * the results, if any referenced column isn't present in all the grouping
+    * sets.  (If there are only empty grouping sets, then the HAVING clause
+    * must be degenerate as discussed below.)
+    *
+    * Also, it may be that the clause is so expensive to execute that we're
+    * better off doing it only once per group, despite the loss of
+    * selectivity.  This is hard to estimate short of doing the entire
+    * planning process twice, so we use a heuristic: clauses containing
+    * subplans are left in HAVING.  Otherwise, we move or copy the HAVING
+    * clause into WHERE, in hopes of eliminating tuples before aggregation
+    * instead of after.
      *
      * If the query has explicit grouping then we can simply move such a
      * clause into WHERE; any group that fails the clause will not be in the
@@ -679,7 +685,8 @@ subquery_planner(PlannerGlobal *glob, Query *parse,
     {
         Node       *havingclause = (Node *) lfirst(l);
  
-       if (contain_agg_clause(havingclause) ||
+       if ((parse->groupClause && parse->groupingSets) ||
+           contain_agg_clause(havingclause) ||
             contain_volatile_functions(havingclause) ||
             contain_subplans(havingclause))
         {
diff --git a/src/test/regress/expected/groupingsets.out b/src/test/regress/expected/groupingsets.out

index b0b8c4b7f26d60c40ee736e9f6f86beda802f903..260ccd52c87b03831133d1679e28221c9f0aca84 100644 (file)
--- a/src/test/regress/expected/groupingsets.out
+++ b/src/test/regress/expected/groupingsets.out
@@ -607,6 +607,60 @@ having exists (select 1 from onek b where sum(distinct a.four) = b.four);
     9 |   3
  (25 rows)
  
+-- Tests around pushdown of HAVING clauses, partially testing against previous bugs
+select a,count(*) from gstest2 group by rollup(a) order by a;
+ a | count 
+---+-------
+ 1 |     8
+ 2 |     1
+   |     9
+(3 rows)
+
+select a,count(*) from gstest2 group by rollup(a) having a is distinct from 1 order by a;
+ a | count 
+---+-------
+ 2 |     1
+   |     9
+(2 rows)
+
+explain (costs off)
+  select a,count(*) from gstest2 group by rollup(a) having a is distinct from 1 order by a;
+            QUERY PLAN            
+----------------------------------
+ GroupAggregate
+   Group Key: a
+   Group Key: ()
+   Filter: (a IS DISTINCT FROM 1)
+   ->  Sort
+         Sort Key: a
+         ->  Seq Scan on gstest2
+(7 rows)
+
+select v.c, (select count(*) from gstest2 group by () having v.c)
+  from (values (false),(true)) v(c) order by v.c;
+ c | count 
+---+-------
+ f |      
+ t |     9
+(2 rows)
+
+explain (costs off)
+  select v.c, (select count(*) from gstest2 group by () having v.c)
+    from (values (false),(true)) v(c) order by v.c;
+                        QUERY PLAN                         
+-----------------------------------------------------------
+ Sort
+   Sort Key: "*VALUES*".column1
+   ->  Values Scan on "*VALUES*"
+         SubPlan 1
+           ->  Aggregate
+                 Group Key: ()
+                 Filter: "*VALUES*".column1
+                 ->  Result
+                       One-Time Filter: "*VALUES*".column1
+                       ->  Seq Scan on gstest2
+(10 rows)
+
  -- HAVING with GROUPING queries
  select ten, grouping(ten) from onek
  group by grouping sets(ten) having grouping(ten) >= 0
diff --git a/src/test/regress/sql/groupingsets.sql b/src/test/regress/sql/groupingsets.sql

index bff85d0db558c9263ed6317a4f178350f61c73a9..71cc0ec90077c16ee62c38323fb9195b32a80308 100644 (file)
--- a/src/test/regress/sql/groupingsets.sql
+++ b/src/test/regress/sql/groupingsets.sql
@@ -183,6 +183,18 @@ select ten, sum(distinct four) from onek a
  group by grouping sets((ten,four),(ten))
  having exists (select 1 from onek b where sum(distinct a.four) = b.four);
  
+-- Tests around pushdown of HAVING clauses, partially testing against previous bugs
+select a,count(*) from gstest2 group by rollup(a) order by a;
+select a,count(*) from gstest2 group by rollup(a) having a is distinct from 1 order by a;
+explain (costs off)
+  select a,count(*) from gstest2 group by rollup(a) having a is distinct from 1 order by a;
+
+select v.c, (select count(*) from gstest2 group by () having v.c)
+  from (values (false),(true)) v(c) order by v.c;
+explain (costs off)
+  select v.c, (select count(*) from gstest2 group by () having v.c)
+    from (values (false),(true)) v(c) order by v.c;
+
  -- HAVING with GROUPING queries
  select ten, grouping(ten) from onek
  group by grouping sets(ten) having grouping(ten) >= 0
author	Andres Freund <[email protected]>
	Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)
committer	Andres Freund <[email protected]>
	Mon, 8 Feb 2016 10:03:31 +0000 (11:03 +0100)
src/backend/optimizer/plan/planner.c		patch \| blob \| blame \| history
src/test/regress/expected/groupingsets.out		patch \| blob \| blame \| history
src/test/regress/sql/groupingsets.sql		patch \| blob \| blame \| history