Commit 1d9351a8 authored by Tom Lane

Fix hash partition pruning with asymmetric partition sets.

perform_pruning_combine_step() was not taught about the number of
partition indexes used in hash partitioning; more embarrassingly,
get_matching_hash_bounds() also had it wrong.  These errors are masked
in the common case where all the partitions have the same modulus
and no partition is missing.  However, with missing or unequal-size
partitions, we could erroneously prune some partitions that need
to be scanned, leading to silently wrong query answers.

While a minimal-footprint fix for this could be to export
get_partition_bound_num_indexes and make the incorrect functions use it,
I'm of the opinion that that function should never have existed in the
first place.  It's not reasonable data structure design that
PartitionBoundInfoData lacks any explicit record of the length of
its indexes[] array.  Perhaps that was all right when it could always
be assumed equal to ndatums, but something should have been done about
it as soon as that stopped being true.  Putting in an explicit
"nindexes" field makes both partition_bounds_equal() and
partition_bounds_copy() simpler, safer, and faster than before,
and removes explicit knowledge of the number-of-partition-indexes
rules from some other places too.

This change also makes get_hash_partition_greatest_modulus obsolete.
I left that in place in case any external code uses it, but no core
code does anymore.

Per bug #16840 from Michał Albrycht.  Back-patch to v11 where the
hash partitioning code came in.  (In the back branches, add the new
field at the end of PartitionBoundInfoData to minimize ABI risks.)

Discussion: https://postgr.es/m/16840-571a22976f829ad4@postgresql.org
parent 1b242f42
...@@ -1323,16 +1323,14 @@ get_partition_for_tuple(PartitionDispatch pd, Datum *values, bool *isnull) ...@@ -1323,16 +1323,14 @@ get_partition_for_tuple(PartitionDispatch pd, Datum *values, bool *isnull)
{ {
case PARTITION_STRATEGY_HASH: case PARTITION_STRATEGY_HASH:
{ {
int greatest_modulus;
uint64 rowHash; uint64 rowHash;
greatest_modulus = get_hash_partition_greatest_modulus(boundinfo);
rowHash = compute_partition_hash_value(key->partnatts, rowHash = compute_partition_hash_value(key->partnatts,
key->partsupfunc, key->partsupfunc,
key->partcollation, key->partcollation,
values, isnull); values, isnull);
part_index = boundinfo->indexes[rowHash % greatest_modulus]; part_index = boundinfo->indexes[rowHash % boundinfo->nindexes];
} }
break; break;
......
...@@ -224,7 +224,6 @@ static int partition_range_bsearch(int partnatts, FmgrInfo *partsupfunc, ...@@ -224,7 +224,6 @@ static int partition_range_bsearch(int partnatts, FmgrInfo *partsupfunc,
Oid *partcollation, Oid *partcollation,
PartitionBoundInfo boundinfo, PartitionBoundInfo boundinfo,
PartitionRangeBound *probe, int32 *cmpval); PartitionRangeBound *probe, int32 *cmpval);
static int get_partition_bound_num_indexes(PartitionBoundInfo b);
static Expr *make_partition_op_expr(PartitionKey key, int keynum, static Expr *make_partition_op_expr(PartitionKey key, int keynum,
uint16 strategy, Expr *arg1, Expr *arg2); uint16 strategy, Expr *arg1, Expr *arg2);
static Oid get_partition_operator(PartitionKey key, int col, static Oid get_partition_operator(PartitionKey key, int col,
...@@ -398,6 +397,7 @@ create_hash_bounds(PartitionBoundSpec **boundspecs, int nparts, ...@@ -398,6 +397,7 @@ create_hash_bounds(PartitionBoundSpec **boundspecs, int nparts,
boundinfo->ndatums = ndatums; boundinfo->ndatums = ndatums;
boundinfo->datums = (Datum **) palloc0(ndatums * sizeof(Datum *)); boundinfo->datums = (Datum **) palloc0(ndatums * sizeof(Datum *));
boundinfo->nindexes = greatest_modulus;
boundinfo->indexes = (int *) palloc(greatest_modulus * sizeof(int)); boundinfo->indexes = (int *) palloc(greatest_modulus * sizeof(int));
for (i = 0; i < greatest_modulus; i++) for (i = 0; i < greatest_modulus; i++)
boundinfo->indexes[i] = -1; boundinfo->indexes[i] = -1;
...@@ -530,6 +530,7 @@ create_list_bounds(PartitionBoundSpec **boundspecs, int nparts, ...@@ -530,6 +530,7 @@ create_list_bounds(PartitionBoundSpec **boundspecs, int nparts,
boundinfo->ndatums = ndatums; boundinfo->ndatums = ndatums;
boundinfo->datums = (Datum **) palloc0(ndatums * sizeof(Datum *)); boundinfo->datums = (Datum **) palloc0(ndatums * sizeof(Datum *));
boundinfo->nindexes = ndatums;
boundinfo->indexes = (int *) palloc(ndatums * sizeof(int)); boundinfo->indexes = (int *) palloc(ndatums * sizeof(int));
/* /*
...@@ -725,8 +726,9 @@ create_range_bounds(PartitionBoundSpec **boundspecs, int nparts, ...@@ -725,8 +726,9 @@ create_range_bounds(PartitionBoundSpec **boundspecs, int nparts,
/* /*
* For range partitioning, an additional value of -1 is stored as the last * For range partitioning, an additional value of -1 is stored as the last
* element. * element of the indexes[] array.
*/ */
boundinfo->nindexes = ndatums + 1;
boundinfo->indexes = (int *) palloc((ndatums + 1) * sizeof(int)); boundinfo->indexes = (int *) palloc((ndatums + 1) * sizeof(int));
for (i = 0; i < ndatums; i++) for (i = 0; i < ndatums; i++)
...@@ -807,45 +809,41 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval, ...@@ -807,45 +809,41 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval,
if (b1->ndatums != b2->ndatums) if (b1->ndatums != b2->ndatums)
return false; return false;
if (b1->nindexes != b2->nindexes)
return false;
if (b1->null_index != b2->null_index) if (b1->null_index != b2->null_index)
return false; return false;
if (b1->default_index != b2->default_index) if (b1->default_index != b2->default_index)
return false; return false;
if (b1->strategy == PARTITION_STRATEGY_HASH) /* For all partition strategies, the indexes[] arrays have to match */
for (i = 0; i < b1->nindexes; i++)
{ {
int greatest_modulus = get_hash_partition_greatest_modulus(b1); if (b1->indexes[i] != b2->indexes[i])
/*
* If two hash partitioned tables have different greatest moduli,
* their partition schemes don't match.
*/
if (greatest_modulus != get_hash_partition_greatest_modulus(b2))
return false; return false;
}
/* Finally, compare the datums[] arrays */
if (b1->strategy == PARTITION_STRATEGY_HASH)
{
/* /*
* We arrange the partitions in the ascending order of their moduli * We arrange the partitions in the ascending order of their moduli
* and remainders. Also every modulus is factor of next larger * and remainders. Also every modulus is factor of next larger
* modulus. Therefore we can safely store index of a given partition * modulus. Therefore we can safely store index of a given partition
* in indexes array at remainder of that partition. Also entries at * in indexes array at remainder of that partition. Also entries at
* (remainder + N * modulus) positions in indexes array are all same * (remainder + N * modulus) positions in indexes array are all same
* for (modulus, remainder) specification for any partition. Thus * for (modulus, remainder) specification for any partition. Thus the
* datums array from both the given bounds are same, if and only if * datums arrays from the given bounds are the same, if and only if
* their indexes array will be same. So, it suffices to compare * their indexes arrays are the same. So, it suffices to compare the
* indexes array. * indexes arrays.
*/ *
for (i = 0; i < greatest_modulus; i++) * Nonetheless make sure that the bounds are indeed the same when the
if (b1->indexes[i] != b2->indexes[i])
return false;
#ifdef USE_ASSERT_CHECKING
/*
* Nonetheless make sure that the bounds are indeed same when the
* indexes match. Hash partition bound stores modulus and remainder * indexes match. Hash partition bound stores modulus and remainder
* at b1->datums[i][0] and b1->datums[i][1] position respectively. * at b1->datums[i][0] and b1->datums[i][1] position respectively.
*/ */
#ifdef USE_ASSERT_CHECKING
for (i = 0; i < b1->ndatums; i++) for (i = 0; i < b1->ndatums; i++)
Assert((b1->datums[i][0] == b2->datums[i][0] && Assert((b1->datums[i][0] == b2->datums[i][0] &&
b1->datums[i][1] == b2->datums[i][1])); b1->datums[i][1] == b2->datums[i][1]));
...@@ -891,15 +889,7 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval, ...@@ -891,15 +889,7 @@ partition_bounds_equal(int partnatts, int16 *parttyplen, bool *parttypbyval,
parttypbyval[j], parttyplen[j])) parttypbyval[j], parttyplen[j]))
return false; return false;
} }
if (b1->indexes[i] != b2->indexes[i])
return false;
} }
/* There are ndatums+1 indexes in case of range partitions */
if (b1->strategy == PARTITION_STRATEGY_RANGE &&
b1->indexes[i] != b2->indexes[i])
return false;
} }
return true; return true;
} }
...@@ -920,8 +910,8 @@ partition_bounds_copy(PartitionBoundInfo src, ...@@ -920,8 +910,8 @@ partition_bounds_copy(PartitionBoundInfo src,
PartitionBoundInfo dest; PartitionBoundInfo dest;
int i; int i;
int ndatums; int ndatums;
int nindexes;
int partnatts; int partnatts;
int num_indexes;
bool hash_part; bool hash_part;
int natts; int natts;
...@@ -929,10 +919,9 @@ partition_bounds_copy(PartitionBoundInfo src, ...@@ -929,10 +919,9 @@ partition_bounds_copy(PartitionBoundInfo src,
dest->strategy = src->strategy; dest->strategy = src->strategy;
ndatums = dest->ndatums = src->ndatums; ndatums = dest->ndatums = src->ndatums;
nindexes = dest->nindexes = src->nindexes;
partnatts = key->partnatts; partnatts = key->partnatts;
num_indexes = get_partition_bound_num_indexes(src);
/* List partitioned tables have only a single partition key. */ /* List partitioned tables have only a single partition key. */
Assert(key->strategy != PARTITION_STRATEGY_LIST || partnatts == 1); Assert(key->strategy != PARTITION_STRATEGY_LIST || partnatts == 1);
...@@ -990,8 +979,8 @@ partition_bounds_copy(PartitionBoundInfo src, ...@@ -990,8 +979,8 @@ partition_bounds_copy(PartitionBoundInfo src,
} }
} }
dest->indexes = (int *) palloc(sizeof(int) * num_indexes); dest->indexes = (int *) palloc(sizeof(int) * nindexes);
memcpy(dest->indexes, src->indexes, sizeof(int) * num_indexes); memcpy(dest->indexes, src->indexes, sizeof(int) * nindexes);
dest->null_index = src->null_index; dest->null_index = src->null_index;
dest->default_index = src->default_index; dest->default_index = src->default_index;
...@@ -2456,6 +2445,7 @@ build_merged_partition_bounds(char strategy, List *merged_datums, ...@@ -2456,6 +2445,7 @@ build_merged_partition_bounds(char strategy, List *merged_datums,
} }
Assert(list_length(merged_indexes) == ndatums); Assert(list_length(merged_indexes) == ndatums);
merged_bounds->nindexes = ndatums;
merged_bounds->indexes = (int *) palloc(sizeof(int) * ndatums); merged_bounds->indexes = (int *) palloc(sizeof(int) * ndatums);
pos = 0; pos = 0;
foreach(lc, merged_indexes) foreach(lc, merged_indexes)
...@@ -2889,7 +2879,7 @@ check_new_partition_bound(char *relname, Relation parent, ...@@ -2889,7 +2879,7 @@ check_new_partition_bound(char *relname, Relation parent,
(errcode(ERRCODE_INVALID_OBJECT_DEFINITION), (errcode(ERRCODE_INVALID_OBJECT_DEFINITION),
errmsg("every hash partition modulus must be a factor of the next larger modulus"))); errmsg("every hash partition modulus must be a factor of the next larger modulus")));
greatest_modulus = get_hash_partition_greatest_modulus(boundinfo); greatest_modulus = boundinfo->nindexes;
remainder = spec->remainder; remainder = spec->remainder;
/* /*
...@@ -3282,18 +3272,15 @@ check_default_partition_contents(Relation parent, Relation default_rel, ...@@ -3282,18 +3272,15 @@ check_default_partition_contents(Relation parent, Relation default_rel,
/* /*
* get_hash_partition_greatest_modulus * get_hash_partition_greatest_modulus
* *
* Returns the greatest modulus of the hash partition bound. The greatest * Returns the greatest modulus of the hash partition bound.
* modulus will be at the end of the datums array because hash partitions are * This is no longer used in the core code, but we keep it around
* arranged in the ascending order of their moduli and remainders. * in case external modules are using it.
*/ */
int int
get_hash_partition_greatest_modulus(PartitionBoundInfo bound) get_hash_partition_greatest_modulus(PartitionBoundInfo bound)
{ {
Assert(bound && bound->strategy == PARTITION_STRATEGY_HASH); Assert(bound && bound->strategy == PARTITION_STRATEGY_HASH);
Assert(bound->datums && bound->ndatums > 0); return bound->nindexes;
Assert(DatumGetInt32(bound->datums[bound->ndatums - 1][0]) > 0);
return DatumGetInt32(bound->datums[bound->ndatums - 1][0]);
} }
/* /*
...@@ -3697,46 +3684,6 @@ qsort_partition_rbound_cmp(const void *a, const void *b, void *arg) ...@@ -3697,46 +3684,6 @@ qsort_partition_rbound_cmp(const void *a, const void *b, void *arg)
b1, b2); b1, b2);
} }
/*
* get_partition_bound_num_indexes
*
* Returns the number of entries in the indexes[] array of the given
* partition bound.  The count depends on the partitioning strategy:
* the greatest modulus for hash, ndatums for list, and ndatums + 1 for
* range.  Any other strategy value is reported through elog(ERROR).
*/
static int
get_partition_bound_num_indexes(PartitionBoundInfo bound)
{
int num_indexes;
Assert(bound);
switch (bound->strategy)
{
case PARTITION_STRATEGY_HASH:
/*
* The number of entries in the indexes array is the same as the
* greatest modulus.
*/
num_indexes = get_hash_partition_greatest_modulus(bound);
break;
case PARTITION_STRATEGY_LIST:
/* List bounds have one index entry per datum. */
num_indexes = bound->ndatums;
break;
case PARTITION_STRATEGY_RANGE:
/* Range partitioned table has an extra index. */
num_indexes = bound->ndatums + 1;
break;
default:
/*
* Unknown strategy.  NOTE(review): this relies on elog(ERROR) not
* returning, otherwise num_indexes would be read uninitialized
* below -- confirm against the elog definition.
*/
elog(ERROR, "unexpected partition strategy: %d",
(int) bound->strategy);
}
return num_indexes;
}
/* /*
* get_partition_operator * get_partition_operator
* *
......
...@@ -781,7 +781,10 @@ get_matching_partitions(PartitionPruneContext *context, List *pruning_steps) ...@@ -781,7 +781,10 @@ get_matching_partitions(PartitionPruneContext *context, List *pruning_steps)
scan_default = final_result->scan_default; scan_default = final_result->scan_default;
while ((i = bms_next_member(final_result->bound_offsets, i)) >= 0) while ((i = bms_next_member(final_result->bound_offsets, i)) >= 0)
{ {
int partindex = context->boundinfo->indexes[i]; int partindex;
Assert(i < context->boundinfo->nindexes);
partindex = context->boundinfo->indexes[i];
if (partindex < 0) if (partindex < 0)
{ {
...@@ -2514,20 +2517,19 @@ get_matching_hash_bounds(PartitionPruneContext *context, ...@@ -2514,20 +2517,19 @@ get_matching_hash_bounds(PartitionPruneContext *context,
for (i = 0; i < partnatts; i++) for (i = 0; i < partnatts; i++)
isnull[i] = bms_is_member(i, nullkeys); isnull[i] = bms_is_member(i, nullkeys);
greatest_modulus = get_hash_partition_greatest_modulus(boundinfo);
rowHash = compute_partition_hash_value(partnatts, partsupfunc, partcollation, rowHash = compute_partition_hash_value(partnatts, partsupfunc, partcollation,
values, isnull); values, isnull);
greatest_modulus = boundinfo->nindexes;
if (partindices[rowHash % greatest_modulus] >= 0) if (partindices[rowHash % greatest_modulus] >= 0)
result->bound_offsets = result->bound_offsets =
bms_make_singleton(rowHash % greatest_modulus); bms_make_singleton(rowHash % greatest_modulus);
} }
else else
{ {
/* Getting here means at least one hash partition exists. */ /* Report all valid offsets into the boundinfo->indexes array. */
Assert(boundinfo->ndatums > 0);
result->bound_offsets = bms_add_range(NULL, 0, result->bound_offsets = bms_add_range(NULL, 0,
boundinfo->ndatums - 1); boundinfo->nindexes - 1);
} }
/* /*
...@@ -3388,30 +3390,20 @@ perform_pruning_combine_step(PartitionPruneContext *context, ...@@ -3388,30 +3390,20 @@ perform_pruning_combine_step(PartitionPruneContext *context,
PartitionPruneStepCombine *cstep, PartitionPruneStepCombine *cstep,
PruneStepResult **step_results) PruneStepResult **step_results)
{ {
ListCell *lc1; PruneStepResult *result = (PruneStepResult *) palloc0(sizeof(PruneStepResult));
PruneStepResult *result = NULL;
bool firststep; bool firststep;
ListCell *lc1;
/* /*
* A combine step without any source steps is an indication to not perform * A combine step without any source steps is an indication to not perform
* any partition pruning. Return all datum indexes in that case. * any partition pruning. Return all datum indexes in that case.
*/ */
result = (PruneStepResult *) palloc0(sizeof(PruneStepResult)); if (cstep->source_stepids == NIL)
if (list_length(cstep->source_stepids) == 0)
{ {
PartitionBoundInfo boundinfo = context->boundinfo; PartitionBoundInfo boundinfo = context->boundinfo;
int rangemax;
/*
* Add all valid offsets into the boundinfo->indexes array. For range
* partitioning, boundinfo->indexes contains (boundinfo->ndatums + 1)
* valid entries; otherwise there are boundinfo->ndatums.
*/
rangemax = context->strategy == PARTITION_STRATEGY_RANGE ?
boundinfo->ndatums : boundinfo->ndatums - 1;
result->bound_offsets = result->bound_offsets =
bms_add_range(result->bound_offsets, 0, rangemax); bms_add_range(NULL, 0, boundinfo->nindexes - 1);
result->scan_default = partition_bound_has_default(boundinfo); result->scan_default = partition_bound_has_default(boundinfo);
result->scan_null = partition_bound_accepts_nulls(boundinfo); result->scan_null = partition_bound_accepts_nulls(boundinfo);
return result; return result;
......
...@@ -30,7 +30,7 @@ struct RelOptInfo; /* avoid including pathnodes.h here */ ...@@ -30,7 +30,7 @@ struct RelOptInfo; /* avoid including pathnodes.h here */
* In the case of range partitioning, ndatums will typically be far less than * In the case of range partitioning, ndatums will typically be far less than
* 2 * nparts, because a partition's upper bound and the next partition's lower * 2 * nparts, because a partition's upper bound and the next partition's lower
* bound are the same in most common cases, and we only store one of them (the * bound are the same in most common cases, and we only store one of them (the
* upper bound). In case of hash partitioning, ndatums will be same as the * upper bound). In case of hash partitioning, ndatums will be the same as the
* number of partitions. * number of partitions.
* *
* For range and list partitioned tables, datums is an array of datum-tuples * For range and list partitioned tables, datums is an array of datum-tuples
...@@ -46,24 +46,31 @@ struct RelOptInfo; /* avoid including pathnodes.h here */ ...@@ -46,24 +46,31 @@ struct RelOptInfo; /* avoid including pathnodes.h here */
* the partition key's operator classes and collations. * the partition key's operator classes and collations.
* *
* In the case of list partitioning, the indexes array stores one entry for * In the case of list partitioning, the indexes array stores one entry for
* every datum, which is the index of the partition that accepts a given datum. * each datum-array entry, which is the index of the partition that accepts
* In case of range partitioning, it stores one entry per distinct range * rows matching that datum. So nindexes == ndatums.
* datum, which is the index of the partition for which a given datum *
* is an upper bound. In the case of hash partitioning, the number of the * In the case of range partitioning, the indexes array stores one entry per
* entries in the indexes array is same as the greatest modulus amongst all * distinct range datum, which is the index of the partition for which that
* partitions. For a given partition key datum-tuple, the index of the * datum is an upper bound (or -1 for a "gap" that has no partition). It is
* partition which would accept that datum-tuple would be given by the entry * convenient to have an extra -1 entry representing values above the last
* pointed by remainder produced when hash value of the datum-tuple is divided * range datum, so nindexes == ndatums + 1.
* by the greatest modulus. *
* In the case of hash partitioning, the number of entries in the indexes
* array is the same as the greatest modulus amongst all partitions (which
* is a multiple of all partition moduli), so nindexes == greatest modulus.
* The indexes array is indexed according to the hash key's remainder modulo
* the greatest modulus, and it contains either the partition index accepting
* that remainder, or -1 if there is no partition for that remainder.
*/ */
typedef struct PartitionBoundInfoData typedef struct PartitionBoundInfoData
{ {
char strategy; /* hash, list or range? */ char strategy; /* hash, list or range? */
int ndatums; /* Length of the datums following array */ int ndatums; /* Length of the datums[] array */
Datum **datums; Datum **datums;
PartitionRangeDatumKind **kind; /* The kind of each range bound datum; PartitionRangeDatumKind **kind; /* The kind of each range bound datum;
* NULL for hash and list partitioned * NULL for hash and list partitioned
* tables */ * tables */
int nindexes; /* Length of the indexes[] array */
int *indexes; /* Partition indexes */ int *indexes; /* Partition indexes */
int null_index; /* Index of the null-accepting partition; -1 int null_index; /* Index of the null-accepting partition; -1
* if there isn't one */ * if there isn't one */
......
...@@ -1538,26 +1538,27 @@ drop table lp, coll_pruning, rlp, mc3p, mc2p, boolpart, boolrangep, rp, coll_pru ...@@ -1538,26 +1538,27 @@ drop table lp, coll_pruning, rlp, mc3p, mc2p, boolpart, boolrangep, rp, coll_pru
-- result on different machines. See the definitions of -- result on different machines. See the definitions of
-- part_part_test_int4_ops and part_test_text_ops in insert.sql. -- part_part_test_int4_ops and part_test_text_ops in insert.sql.
-- --
create table hp (a int, b text) partition by hash (a part_test_int4_ops, b part_test_text_ops); create table hp (a int, b text, c int)
partition by hash (a part_test_int4_ops, b part_test_text_ops);
create table hp0 partition of hp for values with (modulus 4, remainder 0); create table hp0 partition of hp for values with (modulus 4, remainder 0);
create table hp3 partition of hp for values with (modulus 4, remainder 3); create table hp3 partition of hp for values with (modulus 4, remainder 3);
create table hp1 partition of hp for values with (modulus 4, remainder 1); create table hp1 partition of hp for values with (modulus 4, remainder 1);
create table hp2 partition of hp for values with (modulus 4, remainder 2); create table hp2 partition of hp for values with (modulus 4, remainder 2);
insert into hp values (null, null); insert into hp values (null, null, 0);
insert into hp values (1, null); insert into hp values (1, null, 1);
insert into hp values (1, 'xxx'); insert into hp values (1, 'xxx', 2);
insert into hp values (null, 'xxx'); insert into hp values (null, 'xxx', 3);
insert into hp values (2, 'xxx'); insert into hp values (2, 'xxx', 4);
insert into hp values (1, 'abcde'); insert into hp values (1, 'abcde', 5);
select tableoid::regclass, * from hp order by 1; select tableoid::regclass, * from hp order by c;
tableoid | a | b tableoid | a | b | c
----------+---+------- ----------+---+-------+---
hp0 | | hp0 | | | 0
hp0 | 1 | xxx hp1 | 1 | | 1
hp3 | 2 | xxx hp0 | 1 | xxx | 2
hp1 | 1 | hp2 | | xxx | 3
hp2 | | xxx hp3 | 2 | xxx | 4
hp2 | 1 | abcde hp2 | 1 | abcde | 5
(6 rows) (6 rows)
-- partial keys won't prune, nor would non-equality conditions -- partial keys won't prune, nor would non-equality conditions
...@@ -1715,6 +1716,33 @@ explain (costs off) select * from hp where (a = 1 and b = 'abcde') or (a = 2 and ...@@ -1715,6 +1716,33 @@ explain (costs off) select * from hp where (a = 1 and b = 'abcde') or (a = 2 and
Filter: (((a = 1) AND (b = 'abcde'::text)) OR ((a = 2) AND (b = 'xxx'::text)) OR ((a IS NULL) AND (b IS NULL))) Filter: (((a = 1) AND (b = 'abcde'::text)) OR ((a = 2) AND (b = 'xxx'::text)) OR ((a IS NULL) AND (b IS NULL)))
(7 rows) (7 rows)
-- test pruning when not all the partitions exist
drop table hp1;
drop table hp3;
explain (costs off) select * from hp where a = 1 and b = 'abcde';
QUERY PLAN
---------------------------------------------
Seq Scan on hp2 hp
Filter: ((a = 1) AND (b = 'abcde'::text))
(2 rows)
explain (costs off) select * from hp where a = 1 and b = 'abcde' and
(c = 2 or c = 3);
QUERY PLAN
----------------------------------------------------------------------
Seq Scan on hp2 hp
Filter: ((a = 1) AND (b = 'abcde'::text) AND ((c = 2) OR (c = 3)))
(2 rows)
drop table hp2;
explain (costs off) select * from hp where a = 1 and b = 'abcde' and
(c = 2 or c = 3);
QUERY PLAN
--------------------------
Result
One-Time Filter: false
(2 rows)
drop table hp; drop table hp;
-- --
-- Test runtime partition pruning -- Test runtime partition pruning
......
...@@ -304,19 +304,20 @@ drop table lp, coll_pruning, rlp, mc3p, mc2p, boolpart, boolrangep, rp, coll_pru ...@@ -304,19 +304,20 @@ drop table lp, coll_pruning, rlp, mc3p, mc2p, boolpart, boolrangep, rp, coll_pru
-- part_part_test_int4_ops and part_test_text_ops in insert.sql. -- part_part_test_int4_ops and part_test_text_ops in insert.sql.
-- --
create table hp (a int, b text) partition by hash (a part_test_int4_ops, b part_test_text_ops); create table hp (a int, b text, c int)
partition by hash (a part_test_int4_ops, b part_test_text_ops);
create table hp0 partition of hp for values with (modulus 4, remainder 0); create table hp0 partition of hp for values with (modulus 4, remainder 0);
create table hp3 partition of hp for values with (modulus 4, remainder 3); create table hp3 partition of hp for values with (modulus 4, remainder 3);
create table hp1 partition of hp for values with (modulus 4, remainder 1); create table hp1 partition of hp for values with (modulus 4, remainder 1);
create table hp2 partition of hp for values with (modulus 4, remainder 2); create table hp2 partition of hp for values with (modulus 4, remainder 2);
insert into hp values (null, null); insert into hp values (null, null, 0);
insert into hp values (1, null); insert into hp values (1, null, 1);
insert into hp values (1, 'xxx'); insert into hp values (1, 'xxx', 2);
insert into hp values (null, 'xxx'); insert into hp values (null, 'xxx', 3);
insert into hp values (2, 'xxx'); insert into hp values (2, 'xxx', 4);
insert into hp values (1, 'abcde'); insert into hp values (1, 'abcde', 5);
select tableoid::regclass, * from hp order by 1; select tableoid::regclass, * from hp order by c;
-- partial keys won't prune, nor would non-equality conditions -- partial keys won't prune, nor would non-equality conditions
explain (costs off) select * from hp where a = 1; explain (costs off) select * from hp where a = 1;
...@@ -337,6 +338,16 @@ explain (costs off) select * from hp where a = 2 and b = 'xxx'; ...@@ -337,6 +338,16 @@ explain (costs off) select * from hp where a = 2 and b = 'xxx';
explain (costs off) select * from hp where a = 1 and b = 'abcde'; explain (costs off) select * from hp where a = 1 and b = 'abcde';
explain (costs off) select * from hp where (a = 1 and b = 'abcde') or (a = 2 and b = 'xxx') or (a is null and b is null); explain (costs off) select * from hp where (a = 1 and b = 'abcde') or (a = 2 and b = 'xxx') or (a is null and b is null);
-- test pruning when not all the partitions exist
drop table hp1;
drop table hp3;
explain (costs off) select * from hp where a = 1 and b = 'abcde';
explain (costs off) select * from hp where a = 1 and b = 'abcde' and
(c = 2 or c = 3);
drop table hp2;
explain (costs off) select * from hp where a = 1 and b = 'abcde' and
(c = 2 or c = 3);
drop table hp; drop table hp;
-- --
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment