Add missing intarray files.

2025-12-18 05:01:01 +03:00 · 2003-06-11 19:31:05 +00:00
parent a24c5a7b12
commit a237dd2b30
6 changed files with 2750 additions and 0 deletions
--- a/contrib/intarray/_int_gist.c
+++ b/contrib/intarray/_int_gist.c
@@ -0,0 +1,504 @@
+#include "_int.h"
+
+#define GETENTRY(vec,pos) ((ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(vec))[(pos)].key))
+
+/*
+** GiST support methods
+*/
+PG_FUNCTION_INFO_V1(g_int_consistent);
+PG_FUNCTION_INFO_V1(g_int_compress);
+PG_FUNCTION_INFO_V1(g_int_decompress);
+PG_FUNCTION_INFO_V1(g_int_penalty);
+PG_FUNCTION_INFO_V1(g_int_picksplit);
+PG_FUNCTION_INFO_V1(g_int_union);
+PG_FUNCTION_INFO_V1(g_int_same);
+
+Datum		g_int_consistent(PG_FUNCTION_ARGS);
+Datum		g_int_compress(PG_FUNCTION_ARGS);
+Datum		g_int_decompress(PG_FUNCTION_ARGS);
+Datum		g_int_penalty(PG_FUNCTION_ARGS);
+Datum		g_int_picksplit(PG_FUNCTION_ARGS);
+Datum		g_int_union(PG_FUNCTION_ARGS);
+Datum		g_int_same(PG_FUNCTION_ARGS);
+
+
+/*
+** The GiST Consistent method for _intments
+** Should return false if for all data items x below entry,
+** the predicate x op query == FALSE, where op is the oper
+** corresponding to strategy in the pg_amop table.
+*/
+Datum
+g_int_consistent(PG_FUNCTION_ARGS)
+{
+	GISTENTRY  *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
+	ArrayType  *query = (ArrayType *) PG_GETARG_POINTER(1);
+	StrategyNumber strategy = (StrategyNumber) PG_GETARG_UINT16(2);
+	bool		retval;
+
+	if (strategy == BooleanSearchStrategy)
+		PG_RETURN_BOOL(execconsistent((QUERYTYPE *) query,
+							   (ArrayType *) DatumGetPointer(entry->key),
+				  ISLEAFKEY((ArrayType *) DatumGetPointer(entry->key))));
+
+	/* XXX are we sure it's safe to scribble on the query object here? */
+	/* XXX what about toasted input? */
+	/* sort query for fast search, key is already sorted */
+	if (ARRISVOID(query))
+		PG_RETURN_BOOL(false);
+	PREPAREARR(query);
+
+	switch (strategy)
+	{
+		case RTOverlapStrategyNumber:
+			retval = inner_int_overlap((ArrayType *) DatumGetPointer(entry->key),
+									   query);
+			break;
+		case RTSameStrategyNumber:
+			if (GIST_LEAF(entry))
+				DirectFunctionCall3(
+									g_int_same,
+									entry->key,
+									PointerGetDatum(query),
+									PointerGetDatum(&retval)
+					);
+			else
+				retval = inner_int_contains((ArrayType *) DatumGetPointer(entry->key),
+											query);
+			break;
+		case RTContainsStrategyNumber:
+			retval = inner_int_contains((ArrayType *) DatumGetPointer(entry->key),
+										query);
+			break;
+		case RTContainedByStrategyNumber:
+			if (GIST_LEAF(entry))
+				retval = inner_int_contains(query,
+							  (ArrayType *) DatumGetPointer(entry->key));
+			else
+				retval = inner_int_overlap((ArrayType *) DatumGetPointer(entry->key),
+										   query);
+			break;
+		default:
+			retval = FALSE;
+	}
+	PG_RETURN_BOOL(retval);
+}
+
+Datum
+g_int_union(PG_FUNCTION_ARGS) {
+	bytea      *entryvec = (bytea *) PG_GETARG_POINTER(0);
+	int                *size = (int *) PG_GETARG_POINTER(1);
+	int4            i,len = (VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY);
+	ArrayType	*res;
+	int totlen=0,*ptr;
+
+	for (i = 0; i < len; i++)
+		totlen+=ARRNELEMS( GETENTRY(entryvec,i) );
+
+	res=new_intArrayType(totlen);
+	ptr=ARRPTR(res);
+
+	for (i = 0; i < len; i++) {
+		memcpy(ptr, ARRPTR( GETENTRY(entryvec,i) ), ARRNELEMS( GETENTRY(entryvec,i) )*sizeof(int4) );
+		ptr+=ARRNELEMS( GETENTRY(entryvec,i) );
+	}
+
+	QSORT(res,1);
+	res=_int_unique(res);
+	*size = VARSIZE(res);	
+	PG_RETURN_POINTER(res);
+}
+
+/*
+** GiST Compress and Decompress methods
+*/
+Datum
+g_int_compress(PG_FUNCTION_ARGS)
+{
+	GISTENTRY  *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
+	GISTENTRY  *retval;
+	ArrayType  *r;
+	int			len;
+	int		   *dr;
+	int			i,
+				min,
+				cand;
+
+	if (entry->leafkey)
+	{
+		r = (ArrayType *) PG_DETOAST_DATUM_COPY(entry->key);
+		PREPAREARR(r);
+		r->flags |= LEAFKEY;
+		retval = palloc(sizeof(GISTENTRY));
+		gistentryinit(*retval, PointerGetDatum(r),
+			  entry->rel, entry->page, entry->offset, VARSIZE(r), FALSE);
+
+		PG_RETURN_POINTER(retval);
+	}
+
+	r = (ArrayType *) PG_DETOAST_DATUM(entry->key);
+	if (ISLEAFKEY(r) || ARRISVOID(r))
+	{
+		if (r != (ArrayType *) DatumGetPointer(entry->key))
+			pfree(r);
+		PG_RETURN_POINTER(entry);
+	}
+
+	if ((len = ARRNELEMS(r)) >= 2 * MAXNUMRANGE)
+	{							/* compress */
+		if (r == (ArrayType *) DatumGetPointer(entry->key))
+			r = (ArrayType *) PG_DETOAST_DATUM_COPY(entry->key);
+		r = resize_intArrayType(r, 2 * (len));
+
+		dr = ARRPTR(r);
+
+		for (i = len - 1; i >= 0; i--)
+			dr[2 * i] = dr[2 * i + 1] = dr[i];
+
+		len *= 2;
+		cand = 1;
+		while (len > MAXNUMRANGE * 2)
+		{
+			min = 0x7fffffff;
+			for (i = 2; i < len; i += 2)
+				if (min > (dr[i] - dr[i - 1]))
+				{
+					min = (dr[i] - dr[i - 1]);
+					cand = i;
+				}
+			memmove((void *) &dr[cand - 1], (void *) &dr[cand + 1], (len - cand - 1) * sizeof(int));
+			len -= 2;
+		}
+		r = resize_intArrayType(r, len);
+		retval = palloc(sizeof(GISTENTRY));
+		gistentryinit(*retval, PointerGetDatum(r),
+			  entry->rel, entry->page, entry->offset, VARSIZE(r), FALSE);
+		PG_RETURN_POINTER(retval);
+	}
+	else
+		PG_RETURN_POINTER(entry);
+
+	PG_RETURN_POINTER(entry);
+}
+
+Datum
+g_int_decompress(PG_FUNCTION_ARGS)
+{
+	GISTENTRY  *entry = (GISTENTRY *) PG_GETARG_POINTER(0);
+	GISTENTRY  *retval;
+	ArrayType  *r;
+	int		   *dr,
+				lenr;
+	ArrayType  *in;
+	int			lenin;
+	int		   *din;
+	int			i,
+				j;
+
+	in = (ArrayType *) PG_DETOAST_DATUM(entry->key);
+
+	if (ARRISVOID(in))
+		PG_RETURN_POINTER(entry);
+
+	lenin = ARRNELEMS(in);
+
+	if (lenin < 2 * MAXNUMRANGE || ISLEAFKEY(in))
+	{							/* not compressed value */
+		if (in != (ArrayType *) DatumGetPointer(entry->key))
+		{
+			retval = palloc(sizeof(GISTENTRY));
+			gistentryinit(*retval, PointerGetDatum(in),
+			 entry->rel, entry->page, entry->offset, VARSIZE(in), FALSE);
+
+			PG_RETURN_POINTER(retval);
+		}
+		PG_RETURN_POINTER(entry);
+	}
+
+	din = ARRPTR(in);
+	lenr = internal_size(din, lenin);
+
+	r = new_intArrayType(lenr);
+	dr = ARRPTR(r);
+
+	for (i = 0; i < lenin; i += 2)
+		for (j = din[i]; j <= din[i + 1]; j++)
+			if ((!i) || *(dr - 1) != j)
+				*dr++ = j;
+
+	if (in != (ArrayType *) DatumGetPointer(entry->key))
+		pfree(in);
+	retval = palloc(sizeof(GISTENTRY));
+	gistentryinit(*retval, PointerGetDatum(r),
+			  entry->rel, entry->page, entry->offset, VARSIZE(r), FALSE);
+
+	PG_RETURN_POINTER(retval);
+}
+
+/*
+** The GiST Penalty method for _intments
+*/
+Datum
+g_int_penalty(PG_FUNCTION_ARGS) {
+	GISTENTRY *origentry = (GISTENTRY *) PG_GETARG_POINTER(0);
+	GISTENTRY *newentry  = (GISTENTRY *) PG_GETARG_POINTER(1);
+	float *result = (float *) PG_GETARG_POINTER(2);
+	ArrayType  *ud;
+	float		tmp1,
+				tmp2;
+
+	ud = inner_int_union((ArrayType *) DatumGetPointer(origentry->key),
+					(ArrayType *) DatumGetPointer(newentry->key));
+	rt__int_size(ud, &tmp1);
+	rt__int_size((ArrayType *) DatumGetPointer(origentry->key), &tmp2);
+	*result = tmp1 - tmp2;
+	pfree(ud);
+
+	PG_RETURN_POINTER (result);
+}
+
+
+
+Datum
+g_int_same(PG_FUNCTION_ARGS)
+{
+	ArrayType  *a = (ArrayType *) PointerGetDatum(PG_GETARG_POINTER(0));
+	ArrayType  *b = (ArrayType *) PointerGetDatum(PG_GETARG_POINTER(1));
+	bool	   *result = (bool *) PG_GETARG_POINTER(2);
+	int4		n = ARRNELEMS(a);
+	int4	   *da,
+			   *db;
+
+	if (n != ARRNELEMS(b))
+	{
+		*result = false;
+		PG_RETURN_POINTER(result);
+	}
+	*result = TRUE;
+	da = ARRPTR(a);
+	db = ARRPTR(b);
+	while (n--)
+		if (*da++ != *db++)
+		{
+			*result = FALSE;
+			break;
+		}
+
+	PG_RETURN_POINTER(result);
+}
+
+/*****************************************************************
+** Common GiST Method
+*****************************************************************/
+
+typedef struct
+{
+	OffsetNumber pos;
+	float		cost;
+} SPLITCOST;
+
+static int
+comparecost(const void *a, const void *b)
+{
+	if (((SPLITCOST *) a)->cost == ((SPLITCOST *) b)->cost)
+		return 0;
+	else
+		return (((SPLITCOST *) a)->cost > ((SPLITCOST *) b)->cost) ? 1 : -1;
+}
+
+/*
+** The GiST PickSplit method for _intments
+** We use Guttman's poly time split algorithm
+*/
+Datum
+g_int_picksplit(PG_FUNCTION_ARGS) {
+	bytea *entryvec = (bytea *) PG_GETARG_POINTER(0);
+	GIST_SPLITVEC *v = (GIST_SPLITVEC *) PG_GETARG_POINTER(1);
+	OffsetNumber i,
+				j;
+	ArrayType  *datum_alpha,
+			   *datum_beta;
+	ArrayType  *datum_l,
+			   *datum_r;
+	ArrayType  *union_d,
+			   *union_dl,
+			   *union_dr;
+	ArrayType  *inter_d;
+	bool		firsttime;
+	float		size_alpha,
+				size_beta,
+				size_union,
+				size_inter;
+	float		size_waste,
+				waste;
+	float		size_l,
+				size_r;
+	int			nbytes;
+	OffsetNumber seed_1 = 0,
+				seed_2 = 0;
+	OffsetNumber *left,
+			   *right;
+	OffsetNumber maxoff;
+	SPLITCOST  *costvector;
+
+#ifdef GIST_DEBUG
+	elog(DEBUG3, "--------picksplit %d", (VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY));
+#endif
+
+	maxoff = ((VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY)) - 2;
+	nbytes = (maxoff + 2) * sizeof(OffsetNumber);
+	v->spl_left = (OffsetNumber *) palloc(nbytes);
+	v->spl_right = (OffsetNumber *) palloc(nbytes);
+
+	firsttime = true;
+	waste = 0.0;
+	for (i = FirstOffsetNumber; i < maxoff; i = OffsetNumberNext(i))
+	{
+		datum_alpha = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[i].key);
+		for (j = OffsetNumberNext(i); j <= maxoff; j = OffsetNumberNext(j))
+		{
+			datum_beta = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[j].key);
+
+			/* compute the wasted space by unioning these guys */
+			/* size_waste = size_union - size_inter; */
+			union_d = inner_int_union(datum_alpha, datum_beta);
+			rt__int_size(union_d, &size_union);
+			inter_d = inner_int_inter(datum_alpha, datum_beta);
+			rt__int_size(inter_d, &size_inter);
+			size_waste = size_union - size_inter;
+
+			pfree(union_d);
+
+			if (inter_d != (ArrayType *) NULL)
+				pfree(inter_d);
+
+			/*
+			 * are these a more promising split that what we've already
+			 * seen?
+			 */
+
+			if (size_waste > waste || firsttime)
+			{
+				waste = size_waste;
+				seed_1 = i;
+				seed_2 = j;
+				firsttime = false;
+			}
+		}
+	}
+
+	left = v->spl_left;
+	v->spl_nleft = 0;
+	right = v->spl_right;
+	v->spl_nright = 0;
+	if (seed_1 == 0 || seed_2 == 0)
+	{
+		seed_1 = 1;
+		seed_2 = 2;
+	}
+
+	datum_alpha = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[seed_1].key);
+	datum_l = copy_intArrayType(datum_alpha);
+	rt__int_size(datum_l, &size_l);
+	datum_beta = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[seed_2].key);
+	datum_r = copy_intArrayType(datum_beta);
+	rt__int_size(datum_r, &size_r);
+
+	maxoff = OffsetNumberNext(maxoff);
+
+	/*
+	 * sort entries
+	 */
+	costvector = (SPLITCOST *) palloc(sizeof(SPLITCOST) * maxoff);
+	for (i = FirstOffsetNumber; i <= maxoff; i = OffsetNumberNext(i))
+	{
+		costvector[i - 1].pos = i;
+		datum_alpha = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[i].key);
+		union_d = inner_int_union(datum_l, datum_alpha);
+		rt__int_size(union_d, &size_alpha);
+		pfree(union_d);
+		union_d = inner_int_union(datum_r, datum_alpha);
+		rt__int_size(union_d, &size_beta);
+		pfree(union_d);
+		costvector[i - 1].cost = abs((size_alpha - size_l) - (size_beta - size_r));
+	}
+	qsort((void *) costvector, maxoff, sizeof(SPLITCOST), comparecost);
+
+	/*
+	 * Now split up the regions between the two seeds.	An important
+	 * property of this split algorithm is that the split vector v has the
+	 * indices of items to be split in order in its left and right
+	 * vectors.  We exploit this property by doing a merge in the code
+	 * that actually splits the page.
+	 *
+	 * For efficiency, we also place the new index tuple in this loop. This
+	 * is handled at the very end, when we have placed all the existing
+	 * tuples and i == maxoff + 1.
+	 */
+
+
+	for (j = 0; j < maxoff; j++)
+	{
+		i = costvector[j].pos;
+
+		/*
+		 * If we've already decided where to place this item, just put it
+		 * on the right list.  Otherwise, we need to figure out which page
+		 * needs the least enlargement in order to store the item.
+		 */
+
+		if (i == seed_1)
+		{
+			*left++ = i;
+			v->spl_nleft++;
+			continue;
+		}
+		else if (i == seed_2)
+		{
+			*right++ = i;
+			v->spl_nright++;
+			continue;
+		}
+
+		/* okay, which page needs least enlargement? */
+		datum_alpha = (ArrayType *) DatumGetPointer(((GISTENTRY *) VARDATA(entryvec))[i].key);
+		union_dl = inner_int_union(datum_l, datum_alpha);
+		union_dr = inner_int_union(datum_r, datum_alpha);
+		rt__int_size(union_dl, &size_alpha);
+		rt__int_size(union_dr, &size_beta);
+
+		/* pick which page to add it to */
+		if (size_alpha - size_l < size_beta - size_r + WISH_F(v->spl_nleft, v->spl_nright, 0.01))
+		{
+			if (datum_l)
+				pfree(datum_l);
+			if (union_dr)
+				pfree(union_dr);
+			datum_l = union_dl;
+			size_l = size_alpha;
+			*left++ = i;
+			v->spl_nleft++;
+		}
+		else
+		{
+			if (datum_r)
+				pfree(datum_r);
+			if (union_dl)
+				pfree(union_dl);
+			datum_r = union_dr;
+			size_r = size_beta;
+			*right++ = i;
+			v->spl_nright++;
+		}
+	}
+	pfree(costvector);
+	*right = *left = FirstOffsetNumber;
+
+	datum_l->flags &= ~LEAFKEY;
+	datum_r->flags &= ~LEAFKEY;
+	v->spl_ldatum = PointerGetDatum(datum_l);
+	v->spl_rdatum = PointerGetDatum(datum_r);
+
+	PG_RETURN_POINTER(v);
+}
+