postgres/src/include/partitioning/partbounds.h

/*-------------------------------------------------------------------------
 *
 * partbounds.h
 *
 * Copyright (c) 2007-2018, PostgreSQL Global Development Group
 *
 * src/include/partitioning/partbounds.h
 *
 *-------------------------------------------------------------------------
 */
#ifndef PARTBOUNDS_H
#define PARTBOUNDS_H

#include "fmgr.h"
#include "nodes/parsenodes.h"
#include "nodes/pg_list.h"
#include "partitioning/partdefs.h"
#include "utils/relcache.h"


/*
 * PartitionBoundInfoData encapsulates a set of partition bounds. It is
 * usually associated with partitioned tables as part of its partition
 * descriptor, but may also be used to represent a virtual partitioned
 * table such as a partitioned joinrel within the planner.
 *
 * A list partition datum that is known to be NULL is never put into the
 * datums array. Instead, it is tracked using the null_index field.
 *
 * In the case of range partitioning, ndatums will typically be far less than
 * 2 * nparts, because a partition's upper bound and the next partition's lower
 * bound are the same in most common cases, and we only store one of them (the
 * upper bound).  In case of hash partitioning, ndatums will be same as the
 * number of partitions.
 *
 * For range and list partitioned tables, datums is an array of datum-tuples
 * with key->partnatts datums each.  For hash partitioned tables, it is an array
 * of datum-tuples with 2 datums, modulus and remainder, corresponding to a
 * given partition.
 *
 * The datums in datums array are arranged in increasing order as defined by
 * functions qsort_partition_rbound_cmp(), qsort_partition_list_value_cmp() and
 * qsort_partition_hbound_cmp() for range, list and hash partitioned tables
 * respectively. For range and list partitions this simply means that the
 * datums in the datums array are arranged in increasing order as defined by
 * the partition key's operator classes and collations.
 *
 * In the case of list partitioning, the indexes array stores one entry for
 * every datum, which is the index of the partition that accepts a given datum.
 * In case of range partitioning, it stores one entry per distinct range
 * datum, which is the index of the partition for which a given datum
 * is an upper bound.  In the case of hash partitioning, the number of the
 * entries in the indexes array is same as the greatest modulus amongst all
 * partitions.  For a given partition key datum-tuple, the index of the
 * partition which would accept that datum-tuple would be given by the entry
 * pointed by remainder produced when hash value of the datum-tuple is divided
 * by the greatest modulus.
 */

typedef struct PartitionBoundInfoData
{
	char		strategy;		/* hash, list or range? */
	int			ndatums;		/* Length of the datums following array */
	Datum	  **datums;
	PartitionRangeDatumKind **kind; /* The kind of each range bound datum;
									 * NULL for hash and list partitioned
									 * tables */
	int		   *indexes;		/* Partition indexes */
	int			null_index;		/* Index of the null-accepting partition; -1
								 * if there isn't one */
	int			default_index;	/* Index of the default partition; -1 if there
								 * isn't one */
} PartitionBoundInfoData;

#define partition_bound_accepts_nulls(bi) ((bi)->null_index != -1)
#define partition_bound_has_default(bi) ((bi)->default_index != -1)

/*
 * When qsort'ing partition bounds after reading from the catalog, each bound
 * is represented with one of the following structs.
 */

/* One bound of a hash partition */
typedef struct PartitionHashBound
{
	int			modulus;
	int			remainder;
	int			index;
} PartitionHashBound;

/* One value coming from some (index'th) list partition */
typedef struct PartitionListValue
{
	int			index;
	Datum		value;
} PartitionListValue;

/* One bound of a range partition */
typedef struct PartitionRangeBound
{
	int			index;
	Datum	   *datums;			/* range bound datums */
	PartitionRangeDatumKind *kind;	/* the kind of each datum */
	bool		lower;			/* this is the lower (vs upper) bound */
} PartitionRangeBound;

extern int	get_hash_partition_greatest_modulus(PartitionBoundInfo b);
extern uint64 compute_hash_value(int partnatts, FmgrInfo *partsupfunc,
				   Datum *values, bool *isnull);
extern List *get_qual_from_partbound(Relation rel, Relation parent,
						PartitionBoundSpec *spec);
extern bool partition_bounds_equal(int partnatts, int16 *parttyplen,
					   bool *parttypbyval, PartitionBoundInfo b1,
					   PartitionBoundInfo b2);
extern PartitionBoundInfo partition_bounds_copy(PartitionBoundInfo src,
					  PartitionKey key);
extern void check_new_partition_bound(char *relname, Relation parent,
						  PartitionBoundSpec *spec);
extern void check_default_allows_bound(Relation parent, Relation defaultRel,
						   PartitionBoundSpec *new_spec);

extern PartitionRangeBound *make_one_range_bound(PartitionKey key, int index,
					 List *datums, bool lower);
extern int32 partition_hbound_cmp(int modulus1, int remainder1, int modulus2,
					 int remainder2);
extern int32 partition_rbound_cmp(int partnatts, FmgrInfo *partsupfunc,
					 Oid *partcollation, Datum *datums1,
					 PartitionRangeDatumKind *kind1, bool lower1,
					 PartitionRangeBound *b2);
extern int32 partition_rbound_datum_cmp(FmgrInfo *partsupfunc,
						   Oid *partcollation,
						   Datum *rb_datums, PartitionRangeDatumKind *rb_kind,
						   Datum *tuple_datums, int n_tuple_datums);
extern int partition_list_bsearch(FmgrInfo *partsupfunc,
					   Oid *partcollation,
					   PartitionBoundInfo boundinfo,
					   Datum value, bool *is_equal);
extern int partition_range_bsearch(int partnatts, FmgrInfo *partsupfunc,
						Oid *partcollation,
						PartitionBoundInfo boundinfo,
						PartitionRangeBound *probe, bool *is_equal);
extern int partition_range_datum_bsearch(FmgrInfo *partsupfunc,
							  Oid *partcollation,
							  PartitionBoundInfo boundinfo,
							  int nvalues, Datum *values, bool *is_equal);
extern int partition_hash_bsearch(PartitionBoundInfo boundinfo,
					   int modulus, int remainder);

#endif							/* PARTBOUNDS_H */
Faster partition pruning Add a new module backend/partitioning/partprune.c, implementing a more sophisticated algorithm for partition pruning. The new module uses each partition's "boundinfo" for pruning instead of constraint exclusion, based on an idea proposed by Robert Haas of a "pruning program": a list of steps generated from the query quals which are run iteratively to obtain a list of partitions that must be scanned in order to satisfy those quals. At present, this targets planner-time partition pruning, but there exist further patches to apply partition pruning at execution time as well. This commit also moves some definitions from include/catalog/partition.h to a new file include/partitioning/partbounds.h, in an attempt to rationalize partitioning related code. Authors: Amit Langote, David Rowley, Dilip Kumar Reviewers: Robert Haas, Kyotaro Horiguchi, Ashutosh Bapat, Jesper Pedersen. Discussion: https://postgr.es/m/098b9c71-1915-1a2a-8d52-1a7a50ce79e8@lab.ntt.co.jp 8 years ago			`/*-------------------------------------------------------------------------`
			`*`
			`* partbounds.h`
			`*`
			`* Copyright (c) 2007-2018, PostgreSQL Global Development Group`
			`*`
			`* src/include/partitioning/partbounds.h`
			`*`
			`*-------------------------------------------------------------------------`
			`*/`
			`#ifndef PARTBOUNDS_H`
			`#define PARTBOUNDS_H`

Reorganize partitioning code There's been a massive addition of partitioning code in PostgreSQL 11, with little oversight on its placement, resulting in a catalog/partition.c with poorly defined boundaries and responsibilities. This commit tries to set a couple of distinct modules to separate things a little bit. There are no code changes here, only code movement. There are three new files: src/backend/utils/cache/partcache.c src/include/partitioning/partdefs.h src/include/utils/partcache.h The previous arrangement of #including catalog/partition.h almost everywhere is no more. Authors: Amit Langote and Álvaro Herrera Discussion: https://postgr.es/m/98e8d509-790a-128c-be7f-e48a5b2d8d97@lab.ntt.co.jp https://postgr.es/m/11aa0c50-316b-18bb-722d-c23814f39059@lab.ntt.co.jp https://postgr.es/m/143ed9a4-6038-76d4-9a55-502035815e68@lab.ntt.co.jp https://postgr.es/m/20180413193503.nynq7bnmgh6vs5vm@alvherre.pgsql 8 years ago			`#include "fmgr.h"`
			`#include "nodes/parsenodes.h"`
			`#include "nodes/pg_list.h"`
			`#include "partitioning/partdefs.h"`
			`#include "utils/relcache.h"`
Faster partition pruning Add a new module backend/partitioning/partprune.c, implementing a more sophisticated algorithm for partition pruning. The new module uses each partition's "boundinfo" for pruning instead of constraint exclusion, based on an idea proposed by Robert Haas of a "pruning program": a list of steps generated from the query quals which are run iteratively to obtain a list of partitions that must be scanned in order to satisfy those quals. At present, this targets planner-time partition pruning, but there exist further patches to apply partition pruning at execution time as well. This commit also moves some definitions from include/catalog/partition.h to a new file include/partitioning/partbounds.h, in an attempt to rationalize partitioning related code. Authors: Amit Langote, David Rowley, Dilip Kumar Reviewers: Robert Haas, Kyotaro Horiguchi, Ashutosh Bapat, Jesper Pedersen. Discussion: https://postgr.es/m/098b9c71-1915-1a2a-8d52-1a7a50ce79e8@lab.ntt.co.jp 8 years ago

			`/*`
			`* PartitionBoundInfoData encapsulates a set of partition bounds. It is`
			`* usually associated with partitioned tables as part of its partition`
			`* descriptor, but may also be used to represent a virtual partitioned`
			`* table such as a partitioned joinrel within the planner.`
			`*`
			`* A list partition datum that is known to be NULL is never put into the`
			`* datums array. Instead, it is tracked using the null_index field.`
			`*`
			`* In the case of range partitioning, ndatums will typically be far less than`
			`* 2 * nparts, because a partition's upper bound and the next partition's lower`
			`* bound are the same in most common cases, and we only store one of them (the`
			`* upper bound). In case of hash partitioning, ndatums will be same as the`
			`* number of partitions.`
			`*`
			`* For range and list partitioned tables, datums is an array of datum-tuples`
			`* with key->partnatts datums each. For hash partitioned tables, it is an array`
			`* of datum-tuples with 2 datums, modulus and remainder, corresponding to a`
			`* given partition.`
			`*`
			`* The datums in datums array are arranged in increasing order as defined by`
			`* functions qsort_partition_rbound_cmp(), qsort_partition_list_value_cmp() and`
			`* qsort_partition_hbound_cmp() for range, list and hash partitioned tables`
			`* respectively. For range and list partitions this simply means that the`
			`* datums in the datums array are arranged in increasing order as defined by`
			`* the partition key's operator classes and collations.`
			`*`
			`* In the case of list partitioning, the indexes array stores one entry for`
			`* every datum, which is the index of the partition that accepts a given datum.`
			`* In case of range partitioning, it stores one entry per distinct range`
			`* datum, which is the index of the partition for which a given datum`
			`* is an upper bound. In the case of hash partitioning, the number of the`
			`* entries in the indexes array is same as the greatest modulus amongst all`
			`* partitions. For a given partition key datum-tuple, the index of the`
			`* partition which would accept that datum-tuple would be given by the entry`
			`* pointed by remainder produced when hash value of the datum-tuple is divided`
			`* by the greatest modulus.`
			`*/`

			`typedef struct PartitionBoundInfoData`
			`{`
			`char strategy; /* hash, list or range? */`
			`int ndatums; /* Length of the datums following array */`
			`Datum **datums;`
			`PartitionRangeDatumKind *kind; / The kind of each range bound datum;`
			`* NULL for hash and list partitioned`
			`* tables */`
			`int indexes; / Partition indexes */`
			`int null_index; /* Index of the null-accepting partition; -1`
			`* if there isn't one */`
			`int default_index; /* Index of the default partition; -1 if there`
			`* isn't one */`
			`} PartitionBoundInfoData;`

			`#define partition_bound_accepts_nulls(bi) ((bi)->null_index != -1)`
			`#define partition_bound_has_default(bi) ((bi)->default_index != -1)`

			`/*`
			`* When qsort'ing partition bounds after reading from the catalog, each bound`
			`* is represented with one of the following structs.`
			`*/`

			`/* One bound of a hash partition */`
			`typedef struct PartitionHashBound`
			`{`
			`int modulus;`
			`int remainder;`
			`int index;`
			`} PartitionHashBound;`

			`/* One value coming from some (index'th) list partition */`
			`typedef struct PartitionListValue`
			`{`
			`int index;`
			`Datum value;`
			`} PartitionListValue;`

			`/* One bound of a range partition */`
			`typedef struct PartitionRangeBound`
			`{`
			`int index;`
			`Datum datums; / range bound datums */`
			`PartitionRangeDatumKind kind; / the kind of each datum */`
			`bool lower; /* this is the lower (vs upper) bound */`
			`} PartitionRangeBound;`

			`extern int get_hash_partition_greatest_modulus(PartitionBoundInfo b);`
Reorganize partitioning code There's been a massive addition of partitioning code in PostgreSQL 11, with little oversight on its placement, resulting in a catalog/partition.c with poorly defined boundaries and responsibilities. This commit tries to set a couple of distinct modules to separate things a little bit. There are no code changes here, only code movement. There are three new files: src/backend/utils/cache/partcache.c src/include/partitioning/partdefs.h src/include/utils/partcache.h The previous arrangement of #including catalog/partition.h almost everywhere is no more. Authors: Amit Langote and Álvaro Herrera Discussion: https://postgr.es/m/98e8d509-790a-128c-be7f-e48a5b2d8d97@lab.ntt.co.jp https://postgr.es/m/11aa0c50-316b-18bb-722d-c23814f39059@lab.ntt.co.jp https://postgr.es/m/143ed9a4-6038-76d4-9a55-502035815e68@lab.ntt.co.jp https://postgr.es/m/20180413193503.nynq7bnmgh6vs5vm@alvherre.pgsql 8 years ago			`extern uint64 compute_hash_value(int partnatts, FmgrInfo *partsupfunc,`
			`Datum values, bool isnull);`
			`extern List *get_qual_from_partbound(Relation rel, Relation parent,`
			`PartitionBoundSpec *spec);`
			`extern bool partition_bounds_equal(int partnatts, int16 *parttyplen,`
			`bool *parttypbyval, PartitionBoundInfo b1,`
			`PartitionBoundInfo b2);`
			`extern PartitionBoundInfo partition_bounds_copy(PartitionBoundInfo src,`
			`PartitionKey key);`
			`extern void check_new_partition_bound(char *relname, Relation parent,`
			`PartitionBoundSpec *spec);`
			`extern void check_default_allows_bound(Relation parent, Relation defaultRel,`
			`PartitionBoundSpec *new_spec);`

			`extern PartitionRangeBound *make_one_range_bound(PartitionKey key, int index,`
			`List *datums, bool lower);`
			`extern int32 partition_hbound_cmp(int modulus1, int remainder1, int modulus2,`
			`int remainder2);`
			`extern int32 partition_rbound_cmp(int partnatts, FmgrInfo *partsupfunc,`
			`Oid partcollation, Datum datums1,`
			`PartitionRangeDatumKind *kind1, bool lower1,`
			`PartitionRangeBound *b2);`
			`extern int32 partition_rbound_datum_cmp(FmgrInfo *partsupfunc,`
			`Oid *partcollation,`
			`Datum rb_datums, PartitionRangeDatumKind rb_kind,`
			`Datum *tuple_datums, int n_tuple_datums);`
			`extern int partition_list_bsearch(FmgrInfo *partsupfunc,`
			`Oid *partcollation,`
Faster partition pruning Add a new module backend/partitioning/partprune.c, implementing a more sophisticated algorithm for partition pruning. The new module uses each partition's "boundinfo" for pruning instead of constraint exclusion, based on an idea proposed by Robert Haas of a "pruning program": a list of steps generated from the query quals which are run iteratively to obtain a list of partitions that must be scanned in order to satisfy those quals. At present, this targets planner-time partition pruning, but there exist further patches to apply partition pruning at execution time as well. This commit also moves some definitions from include/catalog/partition.h to a new file include/partitioning/partbounds.h, in an attempt to rationalize partitioning related code. Authors: Amit Langote, David Rowley, Dilip Kumar Reviewers: Robert Haas, Kyotaro Horiguchi, Ashutosh Bapat, Jesper Pedersen. Discussion: https://postgr.es/m/098b9c71-1915-1a2a-8d52-1a7a50ce79e8@lab.ntt.co.jp 8 years ago			`PartitionBoundInfo boundinfo,`
			`Datum value, bool *is_equal);`
			`extern int partition_range_bsearch(int partnatts, FmgrInfo *partsupfunc,`
			`Oid *partcollation,`
			`PartitionBoundInfo boundinfo,`
			`PartitionRangeBound probe, bool is_equal);`
			`extern int partition_range_datum_bsearch(FmgrInfo *partsupfunc,`
			`Oid *partcollation,`
			`PartitionBoundInfo boundinfo,`
			`int nvalues, Datum values, bool is_equal);`
			`extern int partition_hash_bsearch(PartitionBoundInfo boundinfo,`
			`int modulus, int remainder);`

			`#endif /* PARTBOUNDS_H */`