src/backend/commands/analyzeutils.c - hawq - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one
  * or more contributor license agreements.  See the NOTICE file
  * distributed with this work for additional information
  * regarding copyright ownership.  The ASF licenses this file
  * to you under the Apache License, Version 2.0 (the
  * "License"); you may not use this file except in compliance
  * with the License.  You may obtain a copy of the License at
  *
  *   http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing,
  * software distributed under the License is distributed on an
  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
  * KIND, either express or implied.  See the License for the
  * specific language governing permissions and limitations
  * under the License.
  */
 /*-------------------------------------------------------------------------
  *
  * analyzeutils.c
  *
  *	  Provides utils functions for analyze.c
  *
  *-------------------------------------------------------------------------
  */
 #include "postgres.h"
 #include "access/heapam.h"
 #include "access/hash.h"
 #include "catalog/pg_statistic.h"
 #include "utils/array.h"
 #include "utils/lsyscache.h"
 #include "utils/datum.h"
 #include "utils/dynahash.h"
 #include "utils/hsearch.h"
 #include "cdb/cdbhash.h"
 #include "cdb/cdbheap.h"
 #include "cdb/cdbpartition.h"
 #include "parser/parse_oper.h"

 #include "commands/analyzeutils.h"

 typedef struct TypInfo
 {
 	Oid typOid;
 	bool typbyval;
 	int16 typlen;
 	Oid ltFuncOp; /* oid of 'less than' operator function id of this type */
 	Oid eqFuncOp; /* oid of equality operator function id of this type */
 } TypInfo;

 /* Functions and structures used for aggregating leaf partition stats */
 typedef struct MCVFreqPair
 {
 	Datum mcv;
 	float4 count;
 	TypInfo *typinfo; /* type information of datum type */
 } MCVFreqPair;

 typedef struct MCVFreqEntry
 {
 	MCVFreqPair *entry;
 } MCVFreqEntry;

 typedef struct PartDatum
 {
 	int partId; /* id of the partition histogram where the datum is from */
 	Datum datum;
 } PartDatum;

 static ArrayType* buildMCVArrayForStatsEntry(MCVFreqPair** mcvpairArray, int nEntries, Oid typoid);
 static ArrayType* buildFreqArrayForStatsEntry(MCVFreqPair** mcvpairArray, int nEntries, float4 reltuples);
 static int datumHashTableMatch(const void*keyPtr1, const void *keyPtr2, Size keysize);
 static uint32 datumHashTableHash(const void *keyPtr, Size keysize);
 static void calculateHashWithHashAny(void *clientData, void *buf, size_t len);
 static HTAB* createDatumHashTable(unsigned int nEntries);
 static MCVFreqPair* MCVFreqPairCopy(MCVFreqPair* mfp);
 static bool containsDatum(HTAB *datumHash, MCVFreqPair *mfp);
 static void addAllMCVsToHashTable
 	(
 	HTAB *datumHash,
 	Oid partOid,
 	HeapTuple heaptupleStats,
 	TypInfo *typInfo,
 	float4 *partReltuples
 	);
 static void addMCVToHashTable(HTAB* datumHash, MCVFreqPair *mfp);
 static int mcvpair_cmp(const void *a, const void *b);

 static void getHistogramHeapTuple(List *lRelOids,
 		Datum **histData,
 		int *nBounds,
 		TypInfo *typInfo,
 		AttrNumber attnum,
 		float4 *partsReltuples,
 		float4 *sumReltuples,
 		int *numNotNullParts);
 static void initTypInfo(TypInfo *typInfo, Oid typOid);
 static int getNextPartDatum(CdbHeap *hp);
 static void initDatumHeap(CdbHeap *hp, Datum **histData, int *cursors, int nParts);
 static int DatumHeapComparator(void *lhs, void *rhs, void *context);
 static void advanceCursor(int pid, int *cursors, int *nBounds);
 static Datum getMinBound(Datum **histData, int *cursors, int *nBounds, int nParts, Oid ltFuncOid);
 static Datum getMaxBound(Datum **histData, int *nBounds, int nParts, Oid ltFuncOid);
 static ArrayType *buildHistogramEntryForStats(List *ldatum,	TypInfo *typInfo);

 /*
  * Given column stats of an attribute, build an MCVFreqPair and add it to the hash table.
  * If the MCV to be added already exist in the hash table, we increment its count value.
  * Input:
  * 	- datumHash: hash table
  * 	- partOid: Oid of current partition
  * 	- typInfo: type information
  * Output:
  *  - partReltuples: the number of tuples in this partition
  */
 static void
 addAllMCVsToHashTable
 	(
 	HTAB *datumHash,
 	Oid partOid,
 	HeapTuple heaptupleStats,
 	TypInfo *typInfo,
 	float4 *partReltuples
 	)
 {
 	float4 reltuples = get_rel_reltuples(partOid);
 	*partReltuples = reltuples;
 	Datum	   *datumMCVs = NULL;
 	int			numMCVs = 0;
 	float4	   *freqs = NULL;
 	int			numFreqs = 0;

 	(void)	get_attstatsslot
 			(
 			heaptupleStats,
 			typInfo->typOid,
 			-1,
 			STATISTIC_KIND_MCV,
 			InvalidOid,
 			&datumMCVs, &numMCVs,
 			&freqs, &numFreqs
 			);

 	Assert(numMCVs == numFreqs);
 	for (int i = 0; i < numMCVs; i++)
 	{
 		Datum mcv = datumMCVs[i];
 		float4 count = reltuples * freqs[i];
 		MCVFreqPair *mfp = (MCVFreqPair *) palloc(sizeof(MCVFreqPair));
 		mfp->mcv = mcv;
 		mfp->count = count;
 		mfp->typinfo = typInfo;
 		addMCVToHashTable(datumHash, mfp);
 		pfree(mfp);
 	}
 	free_attstatsslot(typInfo->typOid, datumMCVs, numMCVs, freqs, numFreqs);
 }


 /*
  * Main function for aggregating leaf partition MCV/Freq to compute
  * root or interior partition MCV/Freq
  * Input:
  * 	- relationOid: Oid of root or interior partition
  * 	- attnum: column number
  * 	- nEntries: target number of MCVs/Freqs to be collected, the real number of
  * 	MCVs/Freqs returned may be less
  * Output:
  * 	- result: two dimensional arrays of MCVs and Freqs
  */
 void
 aggregate_leaf_partition_MCVs
 	(
 	Oid relationOid,
 	AttrNumber attnum,
 	unsigned int nEntries,
 	ArrayType **result
 	)
 {
 	List *lRelOids = rel_get_leaf_children_relids(relationOid); /* list of OIDs of leaf partitions */
 	Oid typoid = get_atttype(relationOid, attnum);
 	TypInfo *typInfo = (TypInfo*) palloc(sizeof(TypInfo));
 	initTypInfo(typInfo, typoid);

 	HTAB* datumHash = createDatumHashTable(nEntries);
 	float4 sumReltuples = 0;

 	ListCell *le = NULL;
 	foreach (le, lRelOids)
 	{
 		Oid partOid = lfirst_oid(le);
 		HeapTuple heaptupleStats = get_att_stats(partOid, attnum);
 		if (!HeapTupleIsValid(heaptupleStats))
 		{
 			continue;
 		}

 		float4 partReltuples = 0;
 		addAllMCVsToHashTable(datumHash, partOid, heaptupleStats, typInfo, &partReltuples);
 		heap_freetuple(heaptupleStats);
 		sumReltuples += partReltuples;
 	}

 	if (0 == hash_get_num_entries(datumHash))
 	{
 		/* in the unlikely event of an emtpy hash table, return early */
 		*result = NULL;
 		result++;
 		*result = NULL;
 		hash_destroy(datumHash);
 		return;
 	}

 	int i = 0;
 	HASH_SEQ_STATUS hash_seq;
 	MCVFreqEntry *mcvfreq;
 	MCVFreqPair **mcvpairArray = palloc(hash_get_num_entries(datumHash) * sizeof(MCVFreqPair*));

 	/* put MCVFreqPairs in an array in order to sort */
 	hash_seq_init(&hash_seq, datumHash);
 	while ((mcvfreq = hash_seq_search(&hash_seq)) != NULL)
 	{
 		mcvpairArray[i++] = mcvfreq->entry;
 	}
 	qsort(mcvpairArray, i, sizeof(MCVFreqPair *), mcvpair_cmp);

 	/* prepare returning MCV and Freq arrays */
 	*result = buildMCVArrayForStatsEntry(mcvpairArray, Min(i, nEntries), typoid);
 	Assert(*result);
 	result++; /* now switch to frequency array (result[1]) */
 	*result = buildFreqArrayForStatsEntry(mcvpairArray, Min(i, nEntries), sumReltuples);

 	hash_destroy(datumHash);
 	pfree(typInfo);
 	pfree(mcvpairArray);

 	return;
 }

 /*
  * Return an array of MCVs from the resultant MCVFreqPair array
  * Input:
  * 	- mcvpairArray: contains MCVs and corresponding counts in desc order
  * 	- nEntries: number of MCVs to be returned
  * 	- typoid: type oid of the MCV datum
  */
 static ArrayType *
 buildMCVArrayForStatsEntry
 	(
 	MCVFreqPair** mcvpairArray,
 	int nEntries,
 	Oid typoid
 	)
 {
 	ArrayType *out = NULL;

 	Assert(mcvpairArray);
 	Assert(nEntries > 0);

 	ArrayBuildState *astate = NULL;

 	for (int i = 0; i < nEntries; i++)
 	{
 		Datum mcv = (mcvpairArray[i])->mcv;
 		astate = accumArrayResult(astate, mcv, false, typoid, CurrentMemoryContext);
 	}

 	if (astate)
 	{
 		out = DatumGetArrayTypeP(makeArrayResult(astate, CurrentMemoryContext));
 	}

 	return out;
 }

 /*
  * Return an array of frequencies from the resultant MCVFreqPair array
  * Input:
  * 	- mcvpairArray: contains MCVs and corresponding counts in desc order
  * 	- nEntries: number of frequencies to be returned
  * 	- reltuples: number of tuples of the root or interior partition (all leaf partitions combined)
  */
 static ArrayType *
 buildFreqArrayForStatsEntry
 	(
 	MCVFreqPair** mcvpairArray,
 	int nEntries,
 	float4 reltuples
 	)
 {
 	Assert(mcvpairArray);
 	Assert(nEntries > 0);
 	Assert(reltuples > 0); /* otherwise ANALYZE will not collect stats */

 	ArrayType *out = NULL;
 	ArrayBuildState *astate = NULL;

 	for (int i = 0; i < nEntries; i++)
 	{
 		float4 freq = mcvpairArray[i]->count / reltuples;
 		astate = accumArrayResult(astate, Float4GetDatum(freq), false, FLOAT4OID, CurrentMemoryContext);
 	}

 	if (astate)
 	{
 		out = DatumGetArrayTypeP(makeArrayResult(astate, CurrentMemoryContext));
 	}

 	return out;
 }

 /*
  * Comparison function to sort an array of MCVFreqPairs in desc order
  */
 static int
 mcvpair_cmp(const void *a, const void *b)
 {
 	Assert(a);
 	Assert(b);

 	MCVFreqPair *mfp1 = *(MCVFreqPair **)a;
 	MCVFreqPair *mfp2 = *(MCVFreqPair **)b;
 	if (mfp1->count > mfp2->count)
 		return -1;
 	if (mfp1->count < mfp2->count)
 		return 1;
 	else
 		return 0;
 }

 /**
  * Add an MCVFreqPair to the hash table, if the same datum already exists
  * in the hash table, update its count
  * Input:
  * 	datumHash - hash table
  * 	mfp - MCVFreqPair to be added
  * 	typbyval - whether the datum inside is passed by value
  * 	typlen - pg_type.typlen of the datum type
  */
 static void
 addMCVToHashTable(HTAB* datumHash, MCVFreqPair *mfp)
 {
 	Assert(datumHash);
 	Assert(mfp);

 	MCVFreqEntry *mcvfreq;
 	bool found = false; /* required by hash_search */

 	if (!containsDatum(datumHash, mfp))
 	{
 		/* create a deep copy of MCVFreqPair and put it in the hash table */
 		MCVFreqPair *key = MCVFreqPairCopy(mfp);
 		mcvfreq = hash_search(datumHash, &key, HASH_ENTER, &found);
 		if (mcvfreq == NULL)
 		{
 			ereport(ERROR, (errcode(ERRCODE_OUT_OF_MEMORY), errmsg("out of memory")));
 		}
 		mcvfreq->entry = key;
 	}

 	else
 	{
 		mcvfreq = hash_search(datumHash, &mfp, HASH_FIND, &found);
 		Assert(mcvfreq);
 		mcvfreq->entry->count += mfp->count;
 	}

 	return;
 }

 /**
  * Copy function for MCVFreqPair
  * Input:
  * 	mfp - input MCVFreqPair
  * 	typbyval - whether the datum inside is passed by value
  * 	typlen - pg_type.typlen of the datum type
  * Output:
  * 	result - a deep copy of input MCVFreqPair
  */
 static MCVFreqPair *
 MCVFreqPairCopy(MCVFreqPair* mfp)
 {
 	MCVFreqPair *result = (MCVFreqPair*) palloc(sizeof(MCVFreqPair));
 	result->count = mfp->count;
 	result->typinfo = mfp->typinfo;
 	result->mcv = datumCopy(mfp->mcv, mfp->typinfo->typbyval, mfp->typinfo->typlen);

 	return result;
 }

 /**
  * Test whether an MCVFreqPair is in the hash table
  * Input:
  * 	datumHash - hash table
  * 	mfp - pointer to an MCVFreqPair
  * Output:
  * 	found - whether the MCVFreqPair is found
  */
 static bool
 containsDatum(HTAB *datumHash, MCVFreqPair *mfp)
 {
 	bool found = false;
 	if (datumHash != NULL)
 		hash_search(datumHash, &mfp, HASH_FIND, &found);

 	return found;
 }

 /**
  * Create a hash table with both hash key and hash entry as a pointer
  * to a MCVFreqPair struct
  * Input:
  * 	nEntries - estimated number of elements in the hash table, the size
  * 	of the hash table can grow dynamically
  * Output:
  * 	a pointer to the created hash table
  */
 static HTAB*
 createDatumHashTable(unsigned int nEntries)
 {
 	HASHCTL	hash_ctl;
 	MemSet(&hash_ctl, 0, sizeof(hash_ctl));

 	hash_ctl.keysize = sizeof(MCVFreqPair*);
 	hash_ctl.entrysize = sizeof(MCVFreqEntry);
 	hash_ctl.hash = datumHashTableHash;
 	hash_ctl.match = datumHashTableMatch;

 	return hash_create("DatumHashTable", nEntries, &hash_ctl, HASH_ELEM | HASH_FUNCTION | HASH_COMPARE);
 }

 /**
  * A generic hash function
  * Input:
  * 	buf - pointer to hash key
  * 	len - number of bytes to be hashed
  * Output:
  * 	clientData - hash value as an unsigned integer
  */
 static void
 calculateHashWithHashAny(void *clientData, void *buf, size_t len)
 {
 	uint32 *result = (uint32*) clientData;
 	*result = hash_any((unsigned char *)buf, len );
 }

 /**
  * Hash function for MCVFreqPair struct pointer.
  * Input:
  * 	keyPtr - pointer to hash key
  * 	keysize - not used, hash function must have this signature
  * Output:
  * 	result - hash value as an unsigned integer
  */
 static uint32
 datumHashTableHash(const void *keyPtr, Size keysize)
 {
 	uint32 result = 0;
 	MCVFreqPair *mfp = *((MCVFreqPair **)keyPtr);

 	hashDatum(mfp->mcv, mfp->typinfo->typOid, calculateHashWithHashAny, &result);

 	return result;
 }

 /**
  * Match function for MCVFreqPair struct pointer.
  * Input:
  * 	keyPtr1, keyPtr2 - pointers to two hash keys
  * 	keysize - not used, hash function must have this signature
  * Output:
  * 	0 if two hash keys match, 1 otherwise
  */
 static int
 datumHashTableMatch(const void *keyPtr1, const void *keyPtr2, Size keysize)
 {
 	Assert(keyPtr1);
 	Assert(keyPtr2);

 	MCVFreqPair *left = *((MCVFreqPair **)keyPtr1);
 	MCVFreqPair *right = *((MCVFreqPair **)keyPtr2);

 	Assert(left->typinfo->typOid == right->typinfo->typOid);

 	return datumCompare(left->mcv, right->mcv, left->typinfo->eqFuncOp) ? 0 : 1;
 }

 /*
  * Main function for aggregating leaf partition histogram to compute
  * root or interior partition histogram
  * Input:
  * 	- relationOid: Oid of root or interior partition
  * 	- attnum: column number
  * 	- nEntries: target number of histogram bounds to be collected, the real number of
  * 	histogram bounds returned may be less
  * Output:
  * 	- result: an array of aggregated histogram bounds
  * Algorithm:
  *
  * 	We use the following example to explain how the aggregating algorithm works.

 	Suppose a parent table 'lineitem' has 3 partitions 'lineitem_prt_1', 'lineitem_prt_2',
 	'lineitem_prt_3'. The histograms of the column of interest of the parts are:

 	hist(prt_1): {0,19,38,59}
 	hist(prt_2): {2,18,40,62}
 	hist(prt_3): {1,22,39,61}

 	Note the histograms are equi-depth, which implies each bucket should contain the same number of tuples.

 	The number of tuples in each part is:

 	nTuples(prt_1) = 300
 	nTuples(prt_2) = 270
 	nTuples(prt_3) = 330

 	Some notation:

 	hist(agg): the aggregated histogram
 	hist(parts): the histograms of the partitions, i.e., {hist(prt_1), hist(prt_2), hist(prt_3)}
 	nEntries: the target number of histogram buckets in hist(agg). Usually this is the same as in the partitions. In this example, nEntries = 3.
 	nParts: the number of partitions. nParts = 3 in this example.

 	Since we know the target number of tuples in each bucket of hist(agg), the basic idea is to fill the buckets of hist(agg) using the buckets in hist(parts). And once a bucket in hist(agg) is filled up, we look at which bucket from hist(parts) is the current bucket, and use its bound as the bucket bound in hist(agg).
 	Continue with our example we have,

 	bucketSize(prt_1) = 300/3 = 100
 	bucketSize(prt_2) = 270/3 = 90
 	bucketSize(prt_3) = 330/3 = 110
 	bucketSize(agg) = (300+270+330)/3 = 300

 	Now, to begin with, we find the minimum of the first boundary point across hist(parts) and use it as the first boundary of hist(agg), i.e.,
 	hist(agg) = {min({0,2,1})} = {0}

 	We need to maintain a priority queue in order to decide on the next bucket from hist(parts) to work with.
 	Each element in the queue is a (Datum, partID) pair, where Datum is a boundary from hist(parts) and partID is the ID of the part the Datum comes from.
 	Each time we dequeue(), we get the minimum datum in the queue as the next datum we will work on.
 	The priority queue contains up to nParts entries. In our example, we first enqueue
 	the second boundary across hist(parts), i.e., 19, 18, 22, along with their part ID.

 	Continue with filling the bucket of hist(agg), we dequeue '18' from the queue and fill in
 	the first bucket (having 90 tuples). Since bucketSize(agg) = 300, we need more buckets
 	from hist(parts) to fill it. At the same time, we dequeue 18 and enqueue the next bound (which is 40).
 	The first bucket of hist(agg) will be filled up by '22' (90+100+110 >= 300), at this time we put '22' as the next boundary value in hist(agg), i.e.
 	hist(agg) = {0,22}

 	Continue with the iteration, we will finally fill all the buckets
 	hist(agg) = {0,22,40,62}
  *
  */
 void
 aggregate_leaf_partition_histograms
 	(
 	Oid relationOid,
 	AttrNumber attnum,
 	unsigned int nEntries,
 	ArrayType **result
 	)
 {
 	List *lRelOids = rel_get_leaf_children_relids(relationOid);
 	int nParts = list_length(lRelOids);
 	Assert(nParts > 0);

 	/* get type information */
 	TypInfo typInfo;
 	Oid typOid = get_atttype(relationOid, attnum);
 	initTypInfo(&typInfo, typOid);

 	Datum *histData[nParts]; /* array of nParts histograms, all histogram bounds from all parts are stored here */
 	int nBounds[nParts]; /* the number of histogram bounds for each part */
 	float4 sumReltuples = 0;
 	float4 partsReltuples[nParts]; /* the number of tuples for each part */
 	memset(histData, 0, nParts * sizeof(Datum *));
 	memset(partsReltuples, 0, nParts * sizeof(float4));
 	memset(nBounds, 0, nParts * sizeof(int));

 	int numNotNullParts = 0;
 	/* populate histData, nBounds, partsReltuples and sumReltuples */
 	getHistogramHeapTuple(lRelOids, histData, nBounds, &typInfo, attnum, partsReltuples, &sumReltuples, &numNotNullParts);

 	if (0 == numNotNullParts)
 	{
 		/* if all the parts histograms are empty, we return nothing */
 		result = NULL;
 		return;
 	}

 	/* reset nParts to the number of non-null parts */
 	nParts = numNotNullParts;

 	/* now define the state variables needed for the aggregation loop */
 	float4 bucketSize = sumReltuples / (nEntries + 1); /* target bucket size in the aggregated histogram */
 	float4 nTuplesToFill = bucketSize; /* remaining number of tuples to fill in the current bucket
 									 of the aggregated histogram, reset to bucketSize when a new
 									 bucket is added */
 	int cursors[nParts]; /* the index of current bucket for each histogram, set to -1
 								  after the histogram has been traversed */
 	float4 eachBucket[nParts]; /* the number of data points in each bucket for each histogram */
 	float4 remainingSize[nParts]; /* remaining number of tuples in the current bucket of a part */
 	memset(cursors, 0, nParts * sizeof(int));
 	memset(eachBucket, 0, nParts * sizeof(float4));
 	memset(remainingSize, 0, nParts * sizeof(float4));

 	/* initialize eachBucket[] and remainingSize[] */
 	for (int i = 0; i < nParts; i++)
 	{
 		if (1 < nBounds[i])
 		{
 			eachBucket[i] = partsReltuples[i] / (nBounds[i] - 1);
 			remainingSize[i] = eachBucket[i];
 		}
 	}

 	int pid = 0; /* part id */
 	/* we maintain a priority queue (min heap) of PartDatum */
 	CdbHeap *dhp = CdbHeap_Create(DatumHeapComparator,
 								&typInfo,
 								nParts /* nSlotMax */,
 								sizeof(PartDatum),
 								NULL /* slotArray */);

 	List *ldatum = NIL; /* list of pointers to the selected bounds */
 	/* the first bound in the aggregated histogram will be the minimum of the first bounds of all parts */
 	Datum minBound = getMinBound(histData, cursors, nBounds, nParts, typInfo.ltFuncOp);
 	ldatum = lappend(ldatum, &minBound);

 	/* continue filling the aggregated histogram, starting from the second bound */
 	initDatumHeap(dhp, histData, cursors, nParts);

 	/* loop continues when DatumHeap is not empty yet and the number of histogram boundaries
 	 * has not reached nEntries */
 	while (((pid = getNextPartDatum(dhp)) >= 0) && list_length(ldatum) <= nEntries)
 	{
 		if (remainingSize[pid] < nTuplesToFill)
 		{
 			nTuplesToFill -= remainingSize[pid];
 			advanceCursor(pid, cursors, nBounds);
 			remainingSize[pid] = eachBucket[pid];
 			CdbHeap_DeleteMin(dhp);
 			if (cursors[pid] > 0)
 			{
 				PartDatum pd;
 				pd.partId = pid;
 				pd.datum = histData[pid][cursors[pid]];
 				CdbHeap_Insert(dhp, &pd);
 			}
 		}
 		else
 		{
 			ldatum = lappend(ldatum, &histData[pid][cursors[pid]]);
 			remainingSize[pid] -= nTuplesToFill;
 			nTuplesToFill = bucketSize;
 		}
 	}

 	/* adding the max boundary across all histograms to the aggregated histogram */
 	Datum maxBound = getMaxBound(histData, nBounds, nParts, typInfo.ltFuncOp);
 	ldatum = lappend(ldatum, &maxBound);

 	/* now ldatum contains the resulting boundaries */
 	ArrayType *out = buildHistogramEntryForStats(ldatum, &typInfo);

 	/* clean up */
 	CdbHeap_Destroy(dhp);
 	for (int j = 0; j < nParts; j++)
 	{
 		free_attstatsslot(typOid, histData[j], nBounds[j], NULL, 0);
 	}

 	*result = out;
 }

 /*
  * Obtain all histogram bounds from every partition and store them in a 2D array (histData)
  * Input:
  * 	lRelOids - list of part Oids
  * 	typInfo - type info
  * 	attnum - attribute number
  * Output:
  * 	histData - 2D array of all histogram bounds from every partition
  * 	nBounds - array of the number of histogram bounds (from each partition)
  * 	partsReltuples - array of the number of tuples (from each partition)
  * 	sumReltuples - sum of number of tuples in all partitions
  */
 static void
 getHistogramHeapTuple
 	(
 	List *lRelOids,
 	Datum **histData,
 	int *nBounds,
 	TypInfo *typInfo,
 	AttrNumber attnum,
 	float4 *partsReltuples,
 	float4 *sumReltuples,
 	int *numNotNullParts
 	)
 {
 	int pid = 0;

 	ListCell *le = NULL;
 	foreach (le, lRelOids)
 	{
 		Oid partOid = lfirst_oid(le);
 		float4 nTuples = get_rel_reltuples(partOid);
 		partsReltuples[pid] = nTuples;
 		*sumReltuples += nTuples;
 		HeapTuple heaptupleStats = get_att_stats(partOid, attnum);

 		if (!HeapTupleIsValid(heaptupleStats))
 		{
 			continue;
 		}

 		(void) get_attstatsslot
 				(
 				heaptupleStats,
 				typInfo->typOid,
 				-1,
 				STATISTIC_KIND_HISTOGRAM,
 				InvalidOid,
 				&histData[pid], &nBounds[pid],
 				NULL, /* most common frequencies */
 				NULL  /* number of entries for most common frequencies */
 				);

 		heap_freetuple(heaptupleStats);

 		if (nBounds[pid] > 0)
 		{
 			pid++;
 		}
 	}
 	*numNotNullParts = pid;
 }


 /*
  * Initialize type information
  * Input:
  * 	typOid - Oid of the type
  * Output:
  *  members of typInfo are initialized
  */
 static void
 initTypInfo(TypInfo *typInfo, Oid typOid)
 {
 	typInfo->typOid = typOid;
 	get_typlenbyval(typOid, &typInfo->typlen, &typInfo->typbyval);
 	typInfo->ltFuncOp = ordering_oper_funcid(typOid);
 	typInfo->eqFuncOp = equality_oper_funcid(typOid);
 }

 /*
  * Get the part id of the next PartDatum, which contains the minimum datum value, from the heap
  * Input:
  * 	hp - min heap containing PartDatum
  * Output:
  *  part id of the datum having minimum value in the heap. Return -1 if heap is empty.
  */
 static int
 getNextPartDatum(CdbHeap *hp)
 {
 	if (CdbHeap_Count(hp) > 0)
 	{
 		PartDatum* minElement = CdbHeap_Min(PartDatum, hp);
 		return minElement->partId;
 	}
 	return -1;
 }

 /*
  * Initialize heap by inserting the second histogram bound from each partition histogram.
  * Input:
  * 	hp - heap
  * 	histData - all histogram bounds from each part
  * 	cursors - cursor vector
  * 	nParts - number of partitions
  */
 static void
 initDatumHeap(CdbHeap *hp, Datum **histData, int *cursors, int nParts)
 {
 	for (int pid = 0; pid < nParts; pid++)
 	{
 		if (cursors[pid] > 0) /* do nothing if part histogram only has one element */
 		{
 			PartDatum pd;
 			pd.partId = pid;
 			pd.datum = histData[pid][cursors[pid]];
 			CdbHeap_Insert(hp, &pd);
 		}
 	}
 }

 /*
  * Comparator function of heap element PartDatum
  * Input:
  * 	lhs, rhs - pointers to heap elements
  * 	context - pointer to comparison context
  * Output:
  *  -1 if lhs < rhs
  *  0 if lhs == rhs
  *  1 if lhs > rhs
  */
 static int
 DatumHeapComparator(void *lhs, void *rhs, void *context)
 {
 	Datum d1 = ((PartDatum *)lhs)->datum;
 	Datum d2 = ((PartDatum *)rhs)->datum;
 	TypInfo *typInfo = (TypInfo *) context;

 	if (datumCompare(d1, d2, typInfo->ltFuncOp))
 	{
 		return -1;
 	}

 	if (datumCompare(d1, d2, typInfo->eqFuncOp))
 	{
 		return 0;
 	}

 	return 1;
 }

 /* Advance the cursor of a partition by 1, set to -1 if the end is reached
  * Input:
  * 	pid - partition id
  * 	cursors - cursor vector
  * 	nBounds - array of the number of bounds
  * */
 static void
 advanceCursor(int pid, int *cursors, int *nBounds)
 {
 	cursors[pid]++;
 	if (cursors[pid] >= nBounds[pid])
 	{
 		cursors[pid] = -1;
 	}
 }

 /*
  * Get the minimum bound of all partition bounds. Only need to iterate over
  * the first bound of each partition since the bounds in a histogram are ordered.
  */
 static Datum
 getMinBound(Datum **histData, int *cursors, int *nBounds, int nParts, Oid ltFuncOid)
 {
 	Assert(histData);
 	Assert(histData[0]);
 	Assert(cursors);
 	Assert(nParts > 0);

 	Datum minDatum = histData[0][0];
 	for (int pid = 0; pid < nParts; pid++)
 	{
 		if (datumCompare(histData[pid][0], minDatum, ltFuncOid))
 		{
 			minDatum = histData[pid][0];
 		}
 		advanceCursor(pid, cursors, nBounds);
 	}

 	return minDatum;
 }

 /*
  * Get the maximum bound of all partition bounds. Only need to iterate over
  * the last bound of each partition since the bounds in a histogram are ordered.
  */
 static Datum
 getMaxBound(Datum **histData, int *nBounds, int nParts, Oid ltFuncOid)
 {
 	Assert(histData);
 	Assert(histData[0]);
 	Assert(nParts > 0);

 	Datum maxDatum = histData[0][nBounds[0]-1];
 	for (int pid = 0; pid < nParts; pid++)
 	{
 		if (datumCompare(maxDatum, histData[pid][nBounds[pid]-1], ltFuncOid))
 		{
 			maxDatum = histData[pid][nBounds[pid]-1];
 		}
 	}

 	return maxDatum;
 }

 /*
  * Preparing the output array of histogram bounds, removing any duplicates
  * Input:
  * 	ldatum - list of pointers to the aggregated bounds, may contain duplicates
  * 	typInfo - type information
  * Output:
  *  an array containing the aggregated histogram bounds
  */
 static ArrayType *
 buildHistogramEntryForStats
 	(
 	List *ldatum,
 	TypInfo* typInfo
 	)
 {

 	Assert(ldatum);
 	Assert(typInfo);

 	ArrayType *histArray = NULL;
 	ArrayBuildState *astate = NULL;

 	ListCell *lc = NULL;
 	Datum *prevDatum = (Datum *) linitial(ldatum);
 	int idx = 0;

 	foreach_with_count (lc, ldatum, idx)
 	{
 		Datum *pdatum = (Datum *) lfirst(lc);

 		/* remove duplicate datum in the list, starting from the second datum */
 		if (datumCompare(*pdatum, *prevDatum, typInfo->eqFuncOp) && idx > 0)
 		{
 			continue;
 		}

 		astate = accumArrayResult(astate, *pdatum, false, typInfo->typOid, CurrentMemoryContext);
 		*prevDatum = *pdatum;
 	}

 	if (astate)
 	{
 		histArray = DatumGetArrayTypeP(makeArrayResult(astate, CurrentMemoryContext));
 	}
 	return histArray;
 }

 /*
  * Comparison function for two datums
  * Input:
  * 	d1, d2 - datums
  * 	opFuncOid - oid of the function for comparison operator of this datum type
  */
 bool
 datumCompare(Datum d1, Datum d2, Oid opFuncOid)
 {
 	FmgrInfo	ltproc;
 	fmgr_info(opFuncOid, &ltproc);
 	return DatumGetBool(FunctionCall2(&ltproc, d1, d2));
 }