mirror of
				https://github.com/postgres/postgres.git
				synced 2025-10-25 13:17:41 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			1133 lines
		
	
	
		
			23 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			1133 lines
		
	
	
		
			23 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /******************************************************************************
 | |
|   This file contains routines that can be bound to a Postgres backend and
 | |
|   called by the backend in the process of processing queries.  The calling
 | |
|   format for these routines is dictated by Postgres architecture.
 | |
| ******************************************************************************/
 | |
| 
 | |
| #include "postgres.h"
 | |
| 
 | |
| #include <float.h>
 | |
| 
 | |
| #include "access/gist.h"
 | |
| #include "access/rtree.h"
 | |
| #include "utils/elog.h"
 | |
| #include "utils/palloc.h"
 | |
| #include "utils/builtins.h"
 | |
| 
 | |
| #include "segdata.h"
 | |
| 
 | |
/*
 * Small arithmetic helpers.  Every argument is evaluated more than once,
 * so do not pass expressions with side effects.  Each use of an argument
 * is parenthesized so that compound expressions such as abs(x - y) expand
 * correctly.
 */
#define max(a,b)		((a) >	(b) ? (a) : (b))
#define min(a,b)		((a) <= (b) ? (a) : (b))
#define abs(a)			((a) <	(0) ? (-(a)) : (a))
 | |
| 
 | |
| /*
 | |
| #define GIST_DEBUG
 | |
| #define GIST_QUERY_DEBUG
 | |
| */
 | |
| 
 | |
/* Scanner and parser entry points used by seg_in() */
extern void set_parse_buffer(char *str);
extern int	seg_yyparse();
 | |
| 
 | |
| /*
 | |
| extern int	 seg_yydebug;
 | |
| */
 | |
| 
 | |
| /*
 | |
| ** Input/Output routines
 | |
| */
 | |
| SEG		   *seg_in(char *str);
 | |
| char	   *seg_out(SEG * seg);
 | |
| float32		seg_lower(SEG * seg);
 | |
| float32		seg_upper(SEG * seg);
 | |
| float32		seg_center(SEG * seg);
 | |
| 
 | |
| /*
 | |
| ** GiST support methods
 | |
| */
 | |
| bool		gseg_consistent(GISTENTRY *entry, SEG * query, StrategyNumber strategy);
 | |
| GISTENTRY  *gseg_compress(GISTENTRY *entry);
 | |
| GISTENTRY  *gseg_decompress(GISTENTRY *entry);
 | |
| float	   *gseg_penalty(GISTENTRY *origentry, GISTENTRY *newentry, float *result);
 | |
| GIST_SPLITVEC *gseg_picksplit(bytea *entryvec, GIST_SPLITVEC *v);
 | |
| bool		gseg_leaf_consistent(SEG * key, SEG * query, StrategyNumber strategy);
 | |
| bool		gseg_internal_consistent(SEG * key, SEG * query, StrategyNumber strategy);
 | |
| SEG		   *gseg_union(bytea *entryvec, int *sizep);
 | |
| SEG		   *gseg_binary_union(SEG * r1, SEG * r2, int *sizep);
 | |
| bool	   *gseg_same(SEG * b1, SEG * b2, bool *result);
 | |
| 
 | |
| 
 | |
| /*
 | |
| ** R-tree suport functions
 | |
| */
 | |
| bool		seg_same(SEG * a, SEG * b);
 | |
| bool		seg_contains_int(SEG * a, int *b);
 | |
| bool		seg_contains_float4(SEG * a, float4 *b);
 | |
| bool		seg_contains_float8(SEG * a, float8 *b);
 | |
| bool		seg_contains(SEG * a, SEG * b);
 | |
| bool		seg_contained(SEG * a, SEG * b);
 | |
| bool		seg_overlap(SEG * a, SEG * b);
 | |
| bool		seg_left(SEG * a, SEG * b);
 | |
| bool		seg_over_left(SEG * a, SEG * b);
 | |
| bool		seg_right(SEG * a, SEG * b);
 | |
| bool		seg_over_right(SEG * a, SEG * b);
 | |
| SEG		   *seg_union(SEG * a, SEG * b);
 | |
| SEG		   *seg_inter(SEG * a, SEG * b);
 | |
| void		rt_seg_size(SEG * a, float *sz);
 | |
| float	   *seg_size(SEG * a);
 | |
| 
 | |
| /*
 | |
| ** Various operators
 | |
| */
 | |
| int32		seg_cmp(SEG * a, SEG * b);
 | |
| bool		seg_lt(SEG * a, SEG * b);
 | |
| bool		seg_le(SEG * a, SEG * b);
 | |
| bool		seg_gt(SEG * a, SEG * b);
 | |
| bool		seg_ge(SEG * a, SEG * b);
 | |
| bool		seg_different(SEG * a, SEG * b);
 | |
| 
 | |
| /*
 | |
| ** Auxiliary funxtions
 | |
| */
 | |
| static int	restore(char *s, float val, int n);
 | |
| int			significant_digits(char *s);
 | |
| 
 | |
| 
 | |
| /*****************************************************************************
 | |
|  * Input/Output functions
 | |
|  *****************************************************************************/
 | |
| 
 | |
| SEG *
 | |
| seg_in(char *str)
 | |
| {
 | |
| 	SEG		   *result = palloc(sizeof(SEG));
 | |
| 
 | |
| 	set_parse_buffer(str);
 | |
| 
 | |
| 	/*
 | |
| 	 * seg_yydebug = 1;
 | |
| 	 */
 | |
| 	if (seg_yyparse(result) != 0)
 | |
| 	{
 | |
| 		pfree(result);
 | |
| 		return NULL;
 | |
| 	}
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * You might have noticed a slight inconsistency between the following
 | |
|  * declaration and the SQL definition:
 | |
|  *	   CREATE FUNCTION seg_out(opaque) RETURNS opaque ...
 | |
|  * The reason is that the argument passed into seg_out is really just a
 | |
|  * pointer. POSTGRES thinks all output functions are:
 | |
|  *	   char *out_func(char *);
 | |
|  */
 | |
| char *
 | |
| seg_out(SEG * seg)
 | |
| {
 | |
| 	char	   *result;
 | |
| 	char	   *p;
 | |
| 
 | |
| 	if (seg == NULL)
 | |
| 		return (NULL);
 | |
| 
 | |
| 	p = result = (char *) palloc(40);
 | |
| 
 | |
| 	if (seg->l_ext == '>' || seg->l_ext == '<' || seg->l_ext == '~')
 | |
| 		p += sprintf(p, "%c", seg->l_ext);
 | |
| 
 | |
| 	if (seg->lower == seg->upper && seg->l_ext == seg->u_ext)
 | |
| 	{
 | |
| 
 | |
| 		/*
 | |
| 		 * indicates that this interval was built by seg_in off a single
 | |
| 		 * point
 | |
| 		 */
 | |
| 		p += restore(p, seg->lower, seg->l_sigd);
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		if (seg->l_ext != '-')
 | |
| 		{
 | |
| 			/* print the lower boudary if exists */
 | |
| 			p += restore(p, seg->lower, seg->l_sigd);
 | |
| 			p += sprintf(p, " ");
 | |
| 		}
 | |
| 		p += sprintf(p, "..");
 | |
| 		if (seg->u_ext != '-')
 | |
| 		{
 | |
| 			/* print the upper boudary if exists */
 | |
| 			p += sprintf(p, " ");
 | |
| 			if (seg->u_ext == '>' || seg->u_ext == '<' || seg->l_ext == '~')
 | |
| 				p += sprintf(p, "%c", seg->u_ext);
 | |
| 			p += restore(p, seg->upper, seg->u_sigd);
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| float32
 | |
| seg_center(SEG * seg)
 | |
| {
 | |
| 	float32		result = (float32) palloc(sizeof(float32data));
 | |
| 
 | |
| 	if (!seg)
 | |
| 		return (float32) NULL;
 | |
| 
 | |
| 	*result = ((float) seg->lower + (float) seg->upper) / 2.0;
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| float32
 | |
| seg_lower(SEG * seg)
 | |
| {
 | |
| 	float32		result = (float32) palloc(sizeof(float32data));
 | |
| 
 | |
| 	if (!seg)
 | |
| 		return (float32) NULL;
 | |
| 
 | |
| 	*result = (float) seg->lower;
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| float32
 | |
| seg_upper(SEG * seg)
 | |
| {
 | |
| 	float32		result = (float32) palloc(sizeof(float32data));
 | |
| 
 | |
| 	if (!seg)
 | |
| 		return (float32) NULL;
 | |
| 
 | |
| 	*result = (float) seg->upper;
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*****************************************************************************
 | |
|  *						   GiST functions
 | |
|  *****************************************************************************/
 | |
| 
 | |
| /*
 | |
| ** The GiST Consistent method for segments
 | |
| ** Should return false if for all data items x below entry,
 | |
| ** the predicate x op query == FALSE, where op is the oper
 | |
| ** corresponding to strategy in the pg_amop table.
 | |
| */
 | |
| bool
 | |
| gseg_consistent(GISTENTRY *entry,
 | |
| 				SEG * query,
 | |
| 				StrategyNumber strategy)
 | |
| {
 | |
| 
 | |
| 	/*
 | |
| 	 * * if entry is not leaf, use gseg_internal_consistent, * else use
 | |
| 	 * gseg_leaf_consistent
 | |
| 	 */
 | |
| 	if (GIST_LEAF(entry))
 | |
| 		return (gseg_leaf_consistent((SEG *) (entry->pred), query, strategy));
 | |
| 	else
 | |
| 		return (gseg_internal_consistent((SEG *) (entry->pred), query, strategy));
 | |
| }
 | |
| 
 | |
| /*
 | |
| ** The GiST Union method for segments
 | |
| ** returns the minimal bounding seg that encloses all the entries in entryvec
 | |
| */
 | |
| SEG *
 | |
| gseg_union(bytea *entryvec, int *sizep)
 | |
| {
 | |
| 	int			numranges,
 | |
| 				i;
 | |
| 	SEG		   *out = (SEG *) NULL;
 | |
| 	SEG		   *tmp;
 | |
| 
 | |
| #ifdef GIST_DEBUG
 | |
| 	fprintf(stderr, "union\n");
 | |
| #endif
 | |
| 
 | |
| 	numranges = (VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY);
 | |
| 	tmp = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[0]).pred;
 | |
| 	*sizep = sizeof(SEG);
 | |
| 
 | |
| 	for (i = 1; i < numranges; i++)
 | |
| 	{
 | |
| 		out = gseg_binary_union(tmp, (SEG *)
 | |
| 						   (((GISTENTRY *) (VARDATA(entryvec)))[i]).pred,
 | |
| 								sizep);
 | |
| #ifdef GIST_DEBUG
 | |
| 
 | |
| 		/*
 | |
| 		 * fprintf(stderr, "\t%s ^ %s -> %s\n", seg_out(tmp), seg_out((SEG
 | |
| 		 * *)(((GISTENTRY *)(VARDATA(entryvec)))[i]).pred), seg_out(out));
 | |
| 		 */
 | |
| #endif
 | |
| 
 | |
| 		if (i > 1)
 | |
| 			pfree(tmp);
 | |
| 		tmp = out;
 | |
| 	}
 | |
| 
 | |
| 	return (out);
 | |
| }
 | |
| 
 | |
| /*
 | |
| ** GiST Compress and Decompress methods for segments
 | |
| ** do not do anything.
 | |
| */
 | |
| GISTENTRY  *
 | |
| gseg_compress(GISTENTRY *entry)
 | |
| {
 | |
| 	return (entry);
 | |
| }
 | |
| 
 | |
| GISTENTRY  *
 | |
| gseg_decompress(GISTENTRY *entry)
 | |
| {
 | |
| 	return (entry);
 | |
| }
 | |
| 
 | |
| /*
 | |
| ** The GiST Penalty method for segments
 | |
| ** As in the R-tree paper, we use change in area as our penalty metric
 | |
| */
 | |
| float *
 | |
| gseg_penalty(GISTENTRY *origentry, GISTENTRY *newentry, float *result)
 | |
| {
 | |
| 	Datum		ud;
 | |
| 	float		tmp1,
 | |
| 				tmp2;
 | |
| 
 | |
| 	ud = (Datum) seg_union((SEG *) (origentry->pred), (SEG *) (newentry->pred));
 | |
| 	rt_seg_size((SEG *) ud, &tmp1);
 | |
| 	rt_seg_size((SEG *) (origentry->pred), &tmp2);
 | |
| 	*result = tmp1 - tmp2;
 | |
| 	pfree((char *) ud);
 | |
| 
 | |
| #ifdef GIST_DEBUG
 | |
| 	fprintf(stderr, "penalty\n");
 | |
| 	fprintf(stderr, "\t%g\n", *result);
 | |
| #endif
 | |
| 
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| /*
 | |
| ** The GiST PickSplit method for segments
 | |
| ** We use Guttman's poly time split algorithm
 | |
| */
 | |
| GIST_SPLITVEC *
 | |
| gseg_picksplit(bytea *entryvec,
 | |
| 			   GIST_SPLITVEC *v)
 | |
| {
 | |
| 	OffsetNumber i,
 | |
| 				j;
 | |
| 	SEG		   *datum_alpha,
 | |
| 			   *datum_beta;
 | |
| 	SEG		   *datum_l,
 | |
| 			   *datum_r;
 | |
| 	SEG		   *union_d,
 | |
| 			   *union_dl,
 | |
| 			   *union_dr;
 | |
| 	SEG		   *inter_d;
 | |
| 	bool		firsttime;
 | |
| 	float		size_alpha,
 | |
| 				size_beta,
 | |
| 				size_union,
 | |
| 				size_inter;
 | |
| 	float		size_waste,
 | |
| 				waste;
 | |
| 	float		size_l,
 | |
| 				size_r;
 | |
| 	int			nbytes;
 | |
| 	OffsetNumber seed_1 = 0,
 | |
| 				seed_2 = 0;
 | |
| 	OffsetNumber *left,
 | |
| 			   *right;
 | |
| 	OffsetNumber maxoff;
 | |
| 
 | |
| #ifdef GIST_DEBUG
 | |
| 	fprintf(stderr, "picksplit\n");
 | |
| #endif
 | |
| 
 | |
| 	maxoff = ((VARSIZE(entryvec) - VARHDRSZ) / sizeof(GISTENTRY)) - 2;
 | |
| 	nbytes = (maxoff + 2) * sizeof(OffsetNumber);
 | |
| 	v->spl_left = (OffsetNumber *) palloc(nbytes);
 | |
| 	v->spl_right = (OffsetNumber *) palloc(nbytes);
 | |
| 
 | |
| 	firsttime = true;
 | |
| 	waste = 0.0;
 | |
| 
 | |
| 	for (i = FirstOffsetNumber; i < maxoff; i = OffsetNumberNext(i))
 | |
| 	{
 | |
| 		datum_alpha = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[i].pred);
 | |
| 		for (j = OffsetNumberNext(i); j <= maxoff; j = OffsetNumberNext(j))
 | |
| 		{
 | |
| 			datum_beta = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[j].pred);
 | |
| 
 | |
| 			/* compute the wasted space by unioning these guys */
 | |
| 			/* size_waste = size_union - size_inter; */
 | |
| 			union_d = (SEG *) seg_union(datum_alpha, datum_beta);
 | |
| 			rt_seg_size(union_d, &size_union);
 | |
| 			inter_d = (SEG *) seg_inter(datum_alpha, datum_beta);
 | |
| 			rt_seg_size(inter_d, &size_inter);
 | |
| 			size_waste = size_union - size_inter;
 | |
| 
 | |
| 			pfree(union_d);
 | |
| 
 | |
| 			if (inter_d != (SEG *) NULL)
 | |
| 				pfree(inter_d);
 | |
| 
 | |
| 			/*
 | |
| 			 * are these a more promising split that what we've already
 | |
| 			 * seen?
 | |
| 			 */
 | |
| 
 | |
| 			if (size_waste > waste || firsttime)
 | |
| 			{
 | |
| 				waste = size_waste;
 | |
| 				seed_1 = i;
 | |
| 				seed_2 = j;
 | |
| 				firsttime = false;
 | |
| 			}
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	left = v->spl_left;
 | |
| 	v->spl_nleft = 0;
 | |
| 	right = v->spl_right;
 | |
| 	v->spl_nright = 0;
 | |
| 
 | |
| 	datum_alpha = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[seed_1].pred);
 | |
| 	datum_l = (SEG *) seg_union(datum_alpha, datum_alpha);
 | |
| 	rt_seg_size((SEG *) datum_l, &size_l);
 | |
| 	datum_beta = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[seed_2].pred);;
 | |
| 	datum_r = (SEG *) seg_union(datum_beta, datum_beta);
 | |
| 	rt_seg_size((SEG *) datum_r, &size_r);
 | |
| 
 | |
| 	/*
 | |
| 	 * Now split up the regions between the two seeds.	An important
 | |
| 	 * property of this split algorithm is that the split vector v has the
 | |
| 	 * indices of items to be split in order in its left and right
 | |
| 	 * vectors.  We exploit this property by doing a merge in the code
 | |
| 	 * that actually splits the page.
 | |
| 	 *
 | |
| 	 * For efficiency, we also place the new index tuple in this loop. This
 | |
| 	 * is handled at the very end, when we have placed all the existing
 | |
| 	 * tuples and i == maxoff + 1.
 | |
| 	 */
 | |
| 
 | |
| 	maxoff = OffsetNumberNext(maxoff);
 | |
| 	for (i = FirstOffsetNumber; i <= maxoff; i = OffsetNumberNext(i))
 | |
| 	{
 | |
| 
 | |
| 		/*
 | |
| 		 * If we've already decided where to place this item, just put it
 | |
| 		 * on the right list.  Otherwise, we need to figure out which page
 | |
| 		 * needs the least enlargement in order to store the item.
 | |
| 		 */
 | |
| 
 | |
| 		if (i == seed_1)
 | |
| 		{
 | |
| 			*left++ = i;
 | |
| 			v->spl_nleft++;
 | |
| 			continue;
 | |
| 		}
 | |
| 		else if (i == seed_2)
 | |
| 		{
 | |
| 			*right++ = i;
 | |
| 			v->spl_nright++;
 | |
| 			continue;
 | |
| 		}
 | |
| 
 | |
| 		/* okay, which page needs least enlargement? */
 | |
| 		datum_alpha = (SEG *) (((GISTENTRY *) (VARDATA(entryvec)))[i].pred);
 | |
| 		union_dl = (SEG *) seg_union(datum_l, datum_alpha);
 | |
| 		union_dr = (SEG *) seg_union(datum_r, datum_alpha);
 | |
| 		rt_seg_size((SEG *) union_dl, &size_alpha);
 | |
| 		rt_seg_size((SEG *) union_dr, &size_beta);
 | |
| 
 | |
| 		/* pick which page to add it to */
 | |
| 		if (size_alpha - size_l < size_beta - size_r)
 | |
| 		{
 | |
| 			pfree(datum_l);
 | |
| 			pfree(union_dr);
 | |
| 			datum_l = union_dl;
 | |
| 			size_l = size_alpha;
 | |
| 			*left++ = i;
 | |
| 			v->spl_nleft++;
 | |
| 		}
 | |
| 		else
 | |
| 		{
 | |
| 			pfree(datum_r);
 | |
| 			pfree(union_dl);
 | |
| 			datum_r = union_dr;
 | |
| 			size_r = size_alpha;
 | |
| 			*right++ = i;
 | |
| 			v->spl_nright++;
 | |
| 		}
 | |
| 	}
 | |
| 	*left = *right = FirstOffsetNumber; /* sentinel value, see dosplit() */
 | |
| 
 | |
| 	v->spl_ldatum = (char *) datum_l;
 | |
| 	v->spl_rdatum = (char *) datum_r;
 | |
| 
 | |
| 	return v;
 | |
| }
 | |
| 
 | |
| /*
 | |
| ** Equality methods
 | |
| */
 | |
| bool *
 | |
| gseg_same(SEG * b1, SEG * b2, bool *result)
 | |
| {
 | |
| 	if (seg_same(b1, b2))
 | |
| 		*result = TRUE;
 | |
| 	else
 | |
| 		*result = FALSE;
 | |
| 
 | |
| #ifdef GIST_DEBUG
 | |
| 	fprintf(stderr, "same: %s\n", (*result ? "TRUE" : "FALSE"));
 | |
| #endif
 | |
| 
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| /*
 | |
| ** SUPPORT ROUTINES
 | |
| */
 | |
| bool
 | |
| gseg_leaf_consistent(SEG * key,
 | |
| 					 SEG * query,
 | |
| 					 StrategyNumber strategy)
 | |
| {
 | |
| 	bool		retval;
 | |
| 
 | |
| #ifdef GIST_QUERY_DEBUG
 | |
| 	fprintf(stderr, "leaf_consistent, %d\n", strategy);
 | |
| #endif
 | |
| 
 | |
| 	switch (strategy)
 | |
| 	{
 | |
| 		case RTLeftStrategyNumber:
 | |
| 			retval = (bool) seg_left(key, query);
 | |
| 			break;
 | |
| 		case RTOverLeftStrategyNumber:
 | |
| 			retval = (bool) seg_over_left(key, query);
 | |
| 			break;
 | |
| 		case RTOverlapStrategyNumber:
 | |
| 			retval = (bool) seg_overlap(key, query);
 | |
| 			break;
 | |
| 		case RTOverRightStrategyNumber:
 | |
| 			retval = (bool) seg_over_right(key, query);
 | |
| 			break;
 | |
| 		case RTRightStrategyNumber:
 | |
| 			retval = (bool) seg_right(key, query);
 | |
| 			break;
 | |
| 		case RTSameStrategyNumber:
 | |
| 			retval = (bool) seg_same(key, query);
 | |
| 			break;
 | |
| 		case RTContainsStrategyNumber:
 | |
| 			retval = (bool) seg_contains(key, query);
 | |
| 			break;
 | |
| 		case RTContainedByStrategyNumber:
 | |
| 			retval = (bool) seg_contained(key, query);
 | |
| 			break;
 | |
| 		default:
 | |
| 			retval = FALSE;
 | |
| 	}
 | |
| 	return (retval);
 | |
| }
 | |
| 
 | |
| bool
 | |
| gseg_internal_consistent(SEG * key,
 | |
| 						 SEG * query,
 | |
| 						 StrategyNumber strategy)
 | |
| {
 | |
| 	bool		retval;
 | |
| 
 | |
| #ifdef GIST_QUERY_DEBUG
 | |
| 	fprintf(stderr, "internal_consistent, %d\n", strategy);
 | |
| #endif
 | |
| 
 | |
| 	switch (strategy)
 | |
| 	{
 | |
| 		case RTLeftStrategyNumber:
 | |
| 		case RTOverLeftStrategyNumber:
 | |
| 			retval = (bool) seg_over_left(key, query);
 | |
| 			break;
 | |
| 		case RTOverlapStrategyNumber:
 | |
| 			retval = (bool) seg_overlap(key, query);
 | |
| 			break;
 | |
| 		case RTOverRightStrategyNumber:
 | |
| 		case RTRightStrategyNumber:
 | |
| 			retval = (bool) seg_right(key, query);
 | |
| 			break;
 | |
| 		case RTSameStrategyNumber:
 | |
| 		case RTContainsStrategyNumber:
 | |
| 			retval = (bool) seg_contains(key, query);
 | |
| 			break;
 | |
| 		case RTContainedByStrategyNumber:
 | |
| 			retval = (bool) seg_overlap(key, query);
 | |
| 			break;
 | |
| 		default:
 | |
| 			retval = FALSE;
 | |
| 	}
 | |
| 	return (retval);
 | |
| }
 | |
| 
 | |
| SEG *
 | |
| gseg_binary_union(SEG * r1, SEG * r2, int *sizep)
 | |
| {
 | |
| 	SEG		   *retval;
 | |
| 
 | |
| 	retval = seg_union(r1, r2);
 | |
| 	*sizep = sizeof(SEG);
 | |
| 
 | |
| 	return (retval);
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| seg_contains(SEG * a, SEG * b)
 | |
| {
 | |
| 	return ((a->lower <= b->lower) && (a->upper >= b->upper));
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_contained(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (seg_contains(b, a));
 | |
| }
 | |
| 
 | |
| /*****************************************************************************
 | |
|  * Operator class for R-tree indexing
 | |
|  *****************************************************************************/
 | |
| 
 | |
| bool
 | |
| seg_same(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) == 0;
 | |
| }
 | |
| 
 | |
| /*	seg_overlap -- does a overlap b?
 | |
|  */
 | |
| bool
 | |
| seg_overlap(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (
 | |
| 			((a->upper >= b->upper) && (a->lower <= b->upper))
 | |
| 			||
 | |
| 			((b->upper >= a->upper) && (b->lower <= a->upper))
 | |
| 	);
 | |
| }
 | |
| 
 | |
| /*	seg_overleft -- is the right edge of (a) located to the left of the right edge of (b)?
 | |
|  */
 | |
| bool
 | |
| seg_over_left(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (a->upper <= b->upper && !seg_left(a, b) && !seg_right(a, b));
 | |
| }
 | |
| 
 | |
| /*	seg_left -- is (a) entirely on the left of (b)?
 | |
|  */
 | |
| bool
 | |
| seg_left(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (a->upper < b->lower);
 | |
| }
 | |
| 
 | |
| /*	seg_right -- is (a) entirely on the right of (b)?
 | |
|  */
 | |
| bool
 | |
| seg_right(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (a->lower > b->upper);
 | |
| }
 | |
| 
 | |
| /*	seg_overright -- is the left edge of (a) located to the right of the left edge of (b)?
 | |
|  */
 | |
| bool
 | |
| seg_over_right(SEG * a, SEG * b)
 | |
| {
 | |
| 	return (a->lower >= b->lower && !seg_left(a, b) && !seg_right(a, b));
 | |
| }
 | |
| 
 | |
| 
 | |
| SEG *
 | |
| seg_union(SEG * a, SEG * b)
 | |
| {
 | |
| 	SEG		   *n;
 | |
| 
 | |
| 	n = (SEG *) palloc(sizeof(*n));
 | |
| 
 | |
| 	/* take max of upper endpoints */
 | |
| 	if (a->upper > b->upper)
 | |
| 	{
 | |
| 		n->upper = a->upper;
 | |
| 		n->u_sigd = a->u_sigd;
 | |
| 		n->u_ext = a->u_ext;
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		n->upper = b->upper;
 | |
| 		n->u_sigd = b->u_sigd;
 | |
| 		n->u_ext = b->u_ext;
 | |
| 	}
 | |
| 
 | |
| 	/* take min of lower endpoints */
 | |
| 	if (a->lower < b->lower)
 | |
| 	{
 | |
| 		n->lower = a->lower;
 | |
| 		n->l_sigd = a->l_sigd;
 | |
| 		n->l_ext = a->l_ext;
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		n->lower = b->lower;
 | |
| 		n->l_sigd = b->l_sigd;
 | |
| 		n->l_ext = b->l_ext;
 | |
| 	}
 | |
| 
 | |
| 	return (n);
 | |
| }
 | |
| 
 | |
| 
 | |
| SEG *
 | |
| seg_inter(SEG * a, SEG * b)
 | |
| {
 | |
| 	SEG		   *n;
 | |
| 
 | |
| 	n = (SEG *) palloc(sizeof(*n));
 | |
| 
 | |
| 	/* take min of upper endpoints */
 | |
| 	if (a->upper < b->upper)
 | |
| 	{
 | |
| 		n->upper = a->upper;
 | |
| 		n->u_sigd = a->u_sigd;
 | |
| 		n->u_ext = a->u_ext;
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		n->upper = b->upper;
 | |
| 		n->u_sigd = b->u_sigd;
 | |
| 		n->u_ext = b->u_ext;
 | |
| 	}
 | |
| 
 | |
| 	/* take max of lower endpoints */
 | |
| 	if (a->lower > b->lower)
 | |
| 	{
 | |
| 		n->lower = a->lower;
 | |
| 		n->l_sigd = a->l_sigd;
 | |
| 		n->l_ext = a->l_ext;
 | |
| 	}
 | |
| 	else
 | |
| 	{
 | |
| 		n->lower = b->lower;
 | |
| 		n->l_sigd = b->l_sigd;
 | |
| 		n->l_ext = b->l_ext;
 | |
| 	}
 | |
| 
 | |
| 	return (n);
 | |
| }
 | |
| 
 | |
| void
 | |
| rt_seg_size(SEG * a, float *size)
 | |
| {
 | |
| 	if (a == (SEG *) NULL || a->upper <= a->lower)
 | |
| 		*size = 0.0;
 | |
| 	else
 | |
| 		*size = (float) abs(a->upper - a->lower);
 | |
| 
 | |
| 	return;
 | |
| }
 | |
| 
 | |
| float *
 | |
| seg_size(SEG * a)
 | |
| {
 | |
| 	float	   *result;
 | |
| 
 | |
| 	result = (float *) palloc(sizeof(float));
 | |
| 
 | |
| 	*result = (float) abs(a->upper - a->lower);
 | |
| 
 | |
| 	return (result);
 | |
| }
 | |
| 
 | |
| 
 | |
| /*****************************************************************************
 | |
|  *				   Miscellaneous operators
 | |
|  *****************************************************************************/
 | |
| int32
 | |
| seg_cmp(SEG * a, SEG * b)
 | |
| {
 | |
| 
 | |
| 	/*
 | |
| 	 * First compare on lower boundary position
 | |
| 	 */
 | |
| 	if (a->lower < b->lower)
 | |
| 		return -1;
 | |
| 	if (a->lower > b->lower)
 | |
| 		return 1;
 | |
| 
 | |
| 	/*
 | |
| 	 * a->lower == b->lower, so consider type of boundary.
 | |
| 	 *
 | |
| 	 * A '-' lower bound is < any other kind (this could only be relevant if
 | |
| 	 * -HUGE is used as a regular data value). A '<' lower bound is < any
 | |
| 	 * other kind except '-'. A '>' lower bound is > any other kind.
 | |
| 	 */
 | |
| 	if (a->l_ext != b->l_ext)
 | |
| 	{
 | |
| 		if (a->l_ext == '-')
 | |
| 			return -1;
 | |
| 		if (b->l_ext == '-')
 | |
| 			return 1;
 | |
| 		if (a->l_ext == '<')
 | |
| 			return -1;
 | |
| 		if (b->l_ext == '<')
 | |
| 			return 1;
 | |
| 		if (a->l_ext == '>')
 | |
| 			return 1;
 | |
| 		if (b->l_ext == '>')
 | |
| 			return -1;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * For other boundary types, consider # of significant digits first.
 | |
| 	 */
 | |
| 	if (a->l_sigd < b->l_sigd)	/* (a) is blurred and is likely to include
 | |
| 								 * (b) */
 | |
| 		return -1;
 | |
| 	if (a->l_sigd > b->l_sigd)	/* (a) is less blurred and is likely to be
 | |
| 								 * included in (b) */
 | |
| 		return 1;
 | |
| 
 | |
| 	/*
 | |
| 	 * For same # of digits, an approximate boundary is more blurred than
 | |
| 	 * exact.
 | |
| 	 */
 | |
| 	if (a->l_ext != b->l_ext)
 | |
| 	{
 | |
| 		if (a->l_ext == '~')	/* (a) is approximate, while (b) is exact */
 | |
| 			return -1;
 | |
| 		if (b->l_ext == '~')
 | |
| 			return 1;
 | |
| 		/* can't get here unless data is corrupt */
 | |
| 		elog(ERROR, "seg_cmp: bogus lower boundary types %d %d",
 | |
| 			 (int) a->l_ext, (int) b->l_ext);
 | |
| 	}
 | |
| 
 | |
| 	/* at this point, the lower boundaries are identical */
 | |
| 
 | |
| 	/*
 | |
| 	 * First compare on upper boundary position
 | |
| 	 */
 | |
| 	if (a->upper < b->upper)
 | |
| 		return -1;
 | |
| 	if (a->upper > b->upper)
 | |
| 		return 1;
 | |
| 
 | |
| 	/*
 | |
| 	 * a->upper == b->upper, so consider type of boundary.
 | |
| 	 *
 | |
| 	 * A '-' upper bound is > any other kind (this could only be relevant if
 | |
| 	 * HUGE is used as a regular data value). A '<' upper bound is < any
 | |
| 	 * other kind. A '>' upper bound is > any other kind except '-'.
 | |
| 	 */
 | |
| 	if (a->u_ext != b->u_ext)
 | |
| 	{
 | |
| 		if (a->u_ext == '-')
 | |
| 			return 1;
 | |
| 		if (b->u_ext == '-')
 | |
| 			return -1;
 | |
| 		if (a->u_ext == '<')
 | |
| 			return -1;
 | |
| 		if (b->u_ext == '<')
 | |
| 			return 1;
 | |
| 		if (a->u_ext == '>')
 | |
| 			return 1;
 | |
| 		if (b->u_ext == '>')
 | |
| 			return -1;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * For other boundary types, consider # of significant digits first.
 | |
| 	 * Note result here is converse of the lower-boundary case.
 | |
| 	 */
 | |
| 	if (a->u_sigd < b->u_sigd)	/* (a) is blurred and is likely to include
 | |
| 								 * (b) */
 | |
| 		return 1;
 | |
| 	if (a->u_sigd > b->u_sigd)	/* (a) is less blurred and is likely to be
 | |
| 								 * included in (b) */
 | |
| 		return -1;
 | |
| 
 | |
| 	/*
 | |
| 	 * For same # of digits, an approximate boundary is more blurred than
 | |
| 	 * exact.  Again, result is converse of lower-boundary case.
 | |
| 	 */
 | |
| 	if (a->u_ext != b->u_ext)
 | |
| 	{
 | |
| 		if (a->u_ext == '~')	/* (a) is approximate, while (b) is exact */
 | |
| 			return 1;
 | |
| 		if (b->u_ext == '~')
 | |
| 			return -1;
 | |
| 		/* can't get here unless data is corrupt */
 | |
| 		elog(ERROR, "seg_cmp: bogus upper boundary types %d %d",
 | |
| 			 (int) a->u_ext, (int) b->u_ext);
 | |
| 	}
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_lt(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) < 0;
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_le(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) <= 0;
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_gt(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) > 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| bool
 | |
| seg_ge(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) >= 0;
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_different(SEG * a, SEG * b)
 | |
| {
 | |
| 	return seg_cmp(a, b) != 0;
 | |
| }
 | |
| 
 | |
| 
 | |
| 
 | |
| /*****************************************************************************
 | |
|  *				   Auxiliary functions
 | |
|  *****************************************************************************/
 | |
| 
 | |
/*
 * The purpose of this routine is to print the floating point
 * value with exact number of significant digits. Its behaviour
 * is similar to %.ng except it prints 8.00 where %.ng would
 * print 8.
 *
 *	 result  output buffer; must have room for at least 16 bytes
 *	 val	 value to print
 *	 n		 number of significant digits, clamped to 1 .. FLT_DIG
 *
 * Returns the length of the string written to result.
 *
 * The value is first printed with %-15.(n-1)e.  If the exponent is 0 the
 * mantissa is used as is; if its magnitude is at most 4 the digits are
 * re-laid out in positional notation (or in a compact "d.ddeN" form when
 * the decimal point would fall behind the last significant digit); for
 * larger exponents the %e output is left alone.  Output without an
 * exponent (what printf produces for infinities and NaNs) is returned
 * unchanged.
 */
static int
restore(char *result, float val, int n)
{
	char		efmt[] = "%-15.#e";	/* '#' is replaced by the precision */
	char		buf[25];
	char	   *p;
	char	   *epos;
	int			expo;
	int			i,
				dp,
				sign;

	/* work area: 24 zeroes, so leading/trailing zeroes come for free */
	memset(buf, '0', sizeof(buf) - 1);
	buf[sizeof(buf) - 1] = '\0';

	/*
	 * put a cap on the number of significant digits to avoid nonsense in
	 * the output, and a floor so the format below is always valid
	 */
	if (n > FLT_DIG)
		n = FLT_DIG;
	if (n < 1)
		n = 1;

	/* remember the sign */
	sign = (val < 0 ? 1 : 0);

	/*
	 * makes %-15.(n-1)e -- this format guarantees that the exponent is
	 * always present for finite values
	 */
	efmt[5] = '0' + (n - 1) % 10;

	sprintf(result, efmt, val);

	/* trim the spaces left by the %e */
	p = strchr(result, ' ');
	if (p != NULL)
		*p = '\0';

	/* get the exponent; without one there is nothing to rearrange */
	epos = strchr(result, 'e');
	if (epos == NULL)
		return ((int) strlen(result));
	expo = atoi(epos + 1);

	if (expo == 0)
	{
		/* use the supplied mantissa with sign */
		*epos = '\0';
	}
	else if (expo >= -4 && expo <= 4)
	{
		/*
		 * remove the decimal point from the mantissa and write the digits
		 * to the buf array, starting at position 10
		 */
		for (p = result + sign, i = 10, dp = 0; *p != 'e'; p++, i++)
		{
			buf[i] = *p;
			if (*p == '.')
				dp = i--;		/* skip the decimal point */
		}
		if (dp == 0)
			dp = i--;			/* no decimal point was found in the above
								 * for() loop */

		if (expo > 0)
		{
			if (dp - 10 + expo >= n)
			{
				/*
				 * the decimal point is behind the last significant digit;
				 * the digits in between must be converted to the exponent
				 * and the decimal point placed after the first digit
				 */
				expo = dp - 10 + expo - n;
				buf[10 + n] = '\0';

				/* insert the decimal point */
				if (n > 1)
				{
					dp = 11;
					for (i = 23; i > dp; i--)
						buf[i] = buf[i - 1];
					buf[dp] = '.';
				}

				/*
				 * adjust the exponent by the number of digits after the
				 * decimal point
				 */
				if (n > 1)
					sprintf(&buf[11 + n], "e%d", expo + n - 1);
				else
					sprintf(&buf[11], "e%d", expo + n - 1);
			}
			else
			{
				/* insert the decimal point */
				dp += expo;
				for (i = 23; i > dp; i--)
					buf[i] = buf[i - 1];
				buf[11 + n] = '\0';
				buf[dp] = '.';
			}

			if (sign)
			{
				buf[9] = '-';
				strcpy(result, &buf[9]);
			}
			else
				strcpy(result, &buf[10]);
		}
		else
		{
			/* expo < 0: the zeroes before the digits become "0.00..." */
			dp += expo - 1;
			buf[10 + n] = '\0';
			buf[dp] = '.';
			if (sign)
			{
				buf[dp - 2] = '-';
				strcpy(result, &buf[dp - 2]);
			}
			else
				strcpy(result, &buf[dp - 1]);
		}
	}

	/* do nothing for |expo| > 4; %e must be OK */
	/* just get rid of zeroes after [eE]- and +zeroes after [Ee]. */
	/* ... this is not done yet. */

	return ((int) strlen(result));
}
 | |
| 
 | |
| 
 | |
| /*
 | |
| ** Miscellany
 | |
| */
 | |
| 
 | |
| bool
 | |
| seg_contains_int(SEG * a, int *b)
 | |
| {
 | |
| 	return ((a->lower <= *b) && (a->upper >= *b));
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_contains_float4(SEG * a, float4 *b)
 | |
| {
 | |
| 	return ((a->lower <= *b) && (a->upper >= *b));
 | |
| }
 | |
| 
 | |
| bool
 | |
| seg_contains_float8(SEG * a, float8 *b)
 | |
| {
 | |
| 	return ((a->lower <= *b) && (a->upper >= *b));
 | |
| }
 | |
| 
 | |
/*
 * Find out the number of significant digits in a string representing
 * a floating point number.
 *
 * Leading signs and zeroes are skipped, then a decimal point and the
 * zeroes that follow it.  The digits from there up to the first character
 * that is neither a digit nor '.' are counted.  If there are none (the
 * number is all zeroes), the result is one plus the number of zeroes seen
 * after the leading run, so "0" gives 1 and "0.00" gives 3.
 */
int
significant_digits(char *s)
{
	const char *cur = s;
	int			digits = 0;
	int			zero_count = 1;

	/* skip leading zeroes and sign */
	while (*cur == '0' || *cur == '+' || *cur == '-')
		cur++;

	/* skip decimal point and following zeroes, counting the zeroes */
	while (*cur == '0' || *cur == '.')
	{
		if (*cur == '0')
			zero_count++;
		cur++;
	}

	/* count the digits up to the end of the number */
	for (; *cur != '\0'; cur++)
	{
		if (*cur == '.')
			continue;
		if (*cur < '0' || *cur > '9')
			break;
		digits++;
	}

	return (digits != 0) ? digits : zero_count;
}
 |