ExecHashRemoveNextSkewBucket must physically copy tuples to main hashtable.

author Tom Lane <tgl@sss.pgh.pa.us>

Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)

committer Tom Lane <tgl@sss.pgh.pa.us>

Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)
author Tom Lane <tgl@sss.pgh.pa.us>
Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)
committer Tom Lane <tgl@sss.pgh.pa.us>
Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)
diff --git a/src/backend/executor/nodeHash.c b/src/backend/executor/nodeHash.c

index e7e51d171723c0c721c7a909cd69bc598c44fdcc..ab766b84dc92c752f12836bf0a7fd0a2df899c71 100644 (file)
--- a/src/backend/executor/nodeHash.c
+++ b/src/backend/executor/nodeHash.c
@@ -1574,8 +1574,19 @@ ExecHashRemoveNextSkewBucket(HashJoinTable hashtable)
                 if (batchno == hashtable->curbatch)
                 {
                         /* Move the tuple to the main hash table */
-                       hashTuple->next = hashtable->buckets[bucketno];
-                       hashtable->buckets[bucketno] = hashTuple;
+                       HashJoinTuple copyTuple;
+
+                       /*
+                        * We must copy the tuple into the dense storage, else it will not
+                        * be found by, eg, ExecHashIncreaseNumBatches.
+                        */
+                       copyTuple = (HashJoinTuple) dense_alloc(hashtable, tupleSize);
+                       memcpy(copyTuple, hashTuple, tupleSize);
+                       pfree(hashTuple);
+
+                       copyTuple->next = hashtable->buckets[bucketno];
+                       hashtable->buckets[bucketno] = copyTuple;
+
                         /* We have reduced skew space, but overall space doesn't change */
                         hashtable->spaceUsedSkew -= tupleSize;
                 }
diff --git a/src/test/regress/expected/join.out b/src/test/regress/expected/join.out

index a0c3461e38e97805107f3d41af7bfbf102951983..bade392394644ed5057a7c2c7d445e85415b4154 100644 (file)
--- a/src/test/regress/expected/join.out
+++ b/src/test/regress/expected/join.out
@@ -2331,6 +2331,34 @@ select tt1.*, tt2.* from tt2 right join tt1 on tt1.joincol = tt2.joincol;
  reset enable_hashjoin;
  reset enable_nestloop;
  --
+-- regression test for bug #13908 (hash join with skew tuples & nbatch increase)
+--
+set work_mem to '64kB';
+set enable_mergejoin to off;
+explain (costs off)
+select count(*) from tenk1 a, tenk1 b
+  where a.hundred = b.thousand and (b.fivethous % 10) < 10;
+                         QUERY PLAN                         
+------------------------------------------------------------
+ Aggregate
+   ->  Hash Join
+         Hash Cond: (a.hundred = b.thousand)
+         ->  Index Only Scan using tenk1_hundred on tenk1 a
+         ->  Hash
+               ->  Seq Scan on tenk1 b
+                     Filter: ((fivethous % 10) < 10)
+(7 rows)
+
+select count(*) from tenk1 a, tenk1 b
+  where a.hundred = b.thousand and (b.fivethous % 10) < 10;
+ count  
+--------
+ 100000
+(1 row)
+
+reset work_mem;
+reset enable_mergejoin;
+--
  -- regression test for 8.2 bug with improper re-ordering of left joins
  --
  create temp table tt3(f1 int, f2 text);
diff --git a/src/test/regress/sql/join.sql b/src/test/regress/sql/join.sql

index 560c64fce412bb7990fe9281d13cfe1edcf689fc..c3902d9e9fc6a337623f488e00a16c4b7ab604a0 100644 (file)
--- a/src/test/regress/sql/join.sql
+++ b/src/test/regress/sql/join.sql
@@ -463,6 +463,22 @@ select tt1.*, tt2.* from tt2 right join tt1 on tt1.joincol = tt2.joincol;
  reset enable_hashjoin;
  reset enable_nestloop;
  
+--
+-- regression test for bug #13908 (hash join with skew tuples & nbatch increase)
+--
+
+set work_mem to '64kB';
+set enable_mergejoin to off;
+
+explain (costs off)
+select count(*) from tenk1 a, tenk1 b
+  where a.hundred = b.thousand and (b.fivethous % 10) < 10;
+select count(*) from tenk1 a, tenk1 b
+  where a.hundred = b.thousand and (b.fivethous % 10) < 10;
+
+reset work_mem;
+reset enable_mergejoin;
+
  --
  -- regression test for 8.2 bug with improper re-ordering of left joins
  --
author	Tom Lane <tgl@sss.pgh.pa.us>
	Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)
committer	Tom Lane <tgl@sss.pgh.pa.us>
	Sun, 7 Feb 2016 17:29:17 +0000 (12:29 -0500)
src/backend/executor/nodeHash.c		patch \| blob \| history
src/test/regress/expected/join.out		patch \| blob \| history
src/test/regress/sql/join.sql		patch \| blob \| history