Adjust cost model for HashAgg that spills to disk.

author Jeff Davis <jdavis@postgresql.org>

Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)

committer Jeff Davis <jdavis@postgresql.org>

Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)
author Jeff Davis <jdavis@postgresql.org>
Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)
committer Jeff Davis <jdavis@postgresql.org>
Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)
diff --git a/src/backend/optimizer/path/costsize.c b/src/backend/optimizer/path/costsize.c
index fda4b2c6e875f513c8bf78c87d878e184664bc95..cd3716d494f033f2d2d1a753a291fc4606715120 100644
--- a/src/backend/optimizer/path/costsize.c
+++ b/src/backend/optimizer/path/costsize.c
@@ -2416,6 +2416,7 @@ cost_agg(Path *path, PlannerInfo *root,
                 double          pages;
                 double          pages_written = 0.0;
                 double          pages_read = 0.0;
+               double          spill_cost;
                 double          hashentrysize;
                 double          nbatches;
                 Size            mem_limit;
@@ -2453,9 +2454,21 @@ cost_agg(Path *path, PlannerInfo *root,
                 pages = relation_byte_size(input_tuples, input_width) / BLCKSZ;
                 pages_written = pages_read = pages * depth;
  
+               /*
+                * HashAgg has somewhat worse IO behavior than Sort on typical
+                * hardware/OS combinations. Account for this with a generic penalty.
+                */
+               pages_read *= 2.0;
+               pages_written *= 2.0;
+
                 startup_cost += pages_written * random_page_cost;
                 total_cost += pages_written * random_page_cost;
                 total_cost += pages_read * seq_page_cost;
+
+               /* account for CPU cost of spilling a tuple and reading it back */
+               spill_cost = depth * input_tuples * 2.0 * cpu_tuple_cost;
+               startup_cost += spill_cost;
+               total_cost += spill_cost;
         }
  
         /*
author	Jeff Davis <jdavis@postgresql.org>
	Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)
committer	Jeff Davis <jdavis@postgresql.org>
	Mon, 7 Sep 2020 20:31:59 +0000 (13:31 -0700)