mirror of
https://github.com/postgres/postgres.git
synced 2025-04-22 23:02:54 +03:00
436 lines
6.9 KiB
C
436 lines
6.9 KiB
C
/* ----------
|
|
* lztext.c -
|
|
*
|
|
* $Header: /cvsroot/pgsql/src/backend/utils/adt/Attic/lztext.c,v 1.5 1999/12/28 13:40:48 wieck Exp $
|
|
*
|
|
* Text type with internal LZ compressed representation. Uses the
|
|
* standard PostgreSQL compression method.
|
|
*
|
|
* This code requires that the LZ compressor found in pg_lzcompress
|
|
* codes a usable VARSIZE word at the beginning of the output buffer.
|
|
* ----------
|
|
*/
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <math.h>
|
|
#include <errno.h>
|
|
|
|
#include "postgres.h"
|
|
#include "utils/builtins.h"
|
|
#include "utils/palloc.h"
|
|
#include "utils/pg_lzcompress.h"
|
|
#ifdef MULTIBYTE
|
|
#include "mb/pg_wchar.h"
|
|
#endif
|
|
|
|
/* ----------
|
|
* lztextin -
|
|
*
|
|
* Input function for datatype lztext
|
|
* ----------
|
|
*/
|
|
lztext *
|
|
lztextin(char *str)
|
|
{
|
|
lztext *result;
|
|
int32 rawsize;
|
|
lztext *tmp;
|
|
int tmp_size;
|
|
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (str == NULL)
|
|
return NULL;
|
|
|
|
/* ----------
|
|
* Determine input size and maximum output Datum size
|
|
* ----------
|
|
*/
|
|
rawsize = strlen(str);
|
|
tmp_size = PGLZ_MAX_OUTPUT(rawsize);
|
|
|
|
/* ----------
|
|
* Allocate a temporary result and compress into it
|
|
* ----------
|
|
*/
|
|
tmp = (lztext *) palloc(tmp_size);
|
|
pglz_compress(str, rawsize, tmp, NULL);
|
|
|
|
/* ----------
|
|
* If we miss less than 25% bytes at the end of the temp value,
|
|
* so be it. Therefore we save a palloc()/memcpy()/pfree()
|
|
* sequence.
|
|
* ----------
|
|
*/
|
|
if (tmp_size - tmp->varsize < 256 ||
|
|
tmp_size - tmp->varsize < tmp_size / 4)
|
|
{
|
|
result = tmp;
|
|
} else {
|
|
result = (lztext *) palloc(tmp->varsize);
|
|
memcpy(result, tmp, tmp->varsize);
|
|
pfree(tmp);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztextout -
|
|
*
|
|
* Output function for data type lztext
|
|
* ----------
|
|
*/
|
|
char *
|
|
lztextout(lztext *lz)
|
|
{
|
|
char *result;
|
|
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (lz == NULL)
|
|
{
|
|
result = (char *) palloc(2);
|
|
result[0] = '-';
|
|
result[1] = '\0';
|
|
return result;
|
|
}
|
|
|
|
/* ----------
|
|
* Allocate the result string - the required size is remembered
|
|
* in the lztext header so we don't need a temporary buffer or
|
|
* have to diddle with realloc's.
|
|
* ----------
|
|
*/
|
|
result = (char *) palloc(PGLZ_RAW_SIZE(lz) + 1);
|
|
|
|
/* ----------
|
|
* Decompress and add terminating ZERO
|
|
* ----------
|
|
*/
|
|
pglz_decompress(lz, result);
|
|
result[lz->rawsize] = '\0';
|
|
|
|
/* ----------
|
|
* Return the result
|
|
* ----------
|
|
*/
|
|
return result;
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztextlen -
|
|
*
|
|
* Logical length of lztext field (it's the uncompressed size
|
|
* of the original data).
|
|
* ----------
|
|
*/
|
|
int32
|
|
lztextlen(lztext *lz)
|
|
{
|
|
#ifdef MULTIBYTE
|
|
unsigned char *s1,*s2;
|
|
int len;
|
|
int l;
|
|
int wl;
|
|
#endif
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (lz == NULL)
|
|
return 0;
|
|
|
|
#ifdef MULTIBYTE
|
|
len = 0;
|
|
s1 = s2 = (unsigned char *)lztextout(lz);
|
|
l = PGLZ_RAW_SIZE(lz);
|
|
while (l > 0)
|
|
{
|
|
wl = pg_mblen(s1);
|
|
l -= wl;
|
|
s1 += wl;
|
|
len++;
|
|
}
|
|
pfree((char *)s2);
|
|
return (len);
|
|
#else
|
|
/* ----------
|
|
* without multibyte support, it's the remembered rawsize
|
|
* ----------
|
|
*/
|
|
return PGLZ_RAW_SIZE(lz);
|
|
#endif
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztextoctetlen -
|
|
*
|
|
* Physical length of lztext field (it's the compressed size
|
|
* plus the rawsize field).
|
|
* ----------
|
|
*/
|
|
int32
|
|
lztextoctetlen(lztext *lz)
|
|
{
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (lz == NULL)
|
|
return 0;
|
|
|
|
/* ----------
|
|
* Return the varsize minus the VARSIZE field itself.
|
|
* ----------
|
|
*/
|
|
return VARSIZE(lz) - VARHDRSZ;
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* text_lztext -
|
|
*
|
|
* Convert text to lztext
|
|
* ----------
|
|
*/
|
|
lztext *
|
|
text_lztext(text *txt)
|
|
{
|
|
lztext *result;
|
|
int32 rawsize;
|
|
lztext *tmp;
|
|
int tmp_size;
|
|
char *str;
|
|
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (txt == NULL)
|
|
return NULL;
|
|
|
|
/* ----------
|
|
* Determine input size and eventually tuple size
|
|
* ----------
|
|
*/
|
|
rawsize = VARSIZE(txt) - VARHDRSZ;
|
|
str = VARDATA(txt);
|
|
tmp_size = PGLZ_MAX_OUTPUT(rawsize);
|
|
|
|
/* ----------
|
|
* Allocate a temporary result and compress into it
|
|
* ----------
|
|
*/
|
|
tmp = (lztext *) palloc(tmp_size);
|
|
pglz_compress(str, rawsize, tmp, NULL);
|
|
|
|
/* ----------
|
|
* If we miss less than 25% bytes at the end of the temp value,
|
|
* so be it. Therefore we save a palloc()/memcpy()/pfree()
|
|
* sequence.
|
|
* ----------
|
|
*/
|
|
if (tmp_size - tmp->varsize < 256 ||
|
|
tmp_size - tmp->varsize < tmp_size / 4)
|
|
{
|
|
result = tmp;
|
|
} else {
|
|
result = (lztext *) palloc(tmp->varsize);
|
|
memcpy(result, tmp, tmp->varsize);
|
|
pfree(tmp);
|
|
}
|
|
|
|
return result;
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztext_text -
|
|
*
|
|
* Convert lztext to text
|
|
* ----------
|
|
*/
|
|
text *
|
|
lztext_text(lztext *lz)
|
|
{
|
|
text *result;
|
|
|
|
/* ----------
|
|
* Handle NULL
|
|
* ----------
|
|
*/
|
|
if (lz == NULL)
|
|
return NULL;
|
|
|
|
/* ----------
|
|
* Allocate and initialize the text result
|
|
* ----------
|
|
*/
|
|
result = (text *) palloc(PGLZ_RAW_SIZE(lz) + VARHDRSZ + 1);
|
|
VARSIZE(result) = lz->rawsize + VARHDRSZ;
|
|
|
|
/* ----------
|
|
* Decompress directly into the text data area.
|
|
* ----------
|
|
*/
|
|
VARDATA(result)[lz->rawsize] = 0;
|
|
pglz_decompress(lz, VARDATA(result));
|
|
|
|
return result;
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztext_cmp -
|
|
*
|
|
* Comparision function for two lztext datum's.
|
|
*
|
|
* Returns -1, 0 or 1.
|
|
* ----------
|
|
*/
|
|
int32
|
|
lztext_cmp(lztext *lz1, lztext *lz2)
|
|
{
|
|
#ifdef USE_LOCALE
|
|
|
|
char *cp1;
|
|
char *cp2;
|
|
int result;
|
|
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return (int32)0;
|
|
|
|
cp1 = lztextout(lz1);
|
|
cp2 = lztextout(lz2);
|
|
|
|
result = strcoll(cp1, cp2);
|
|
|
|
pfree(cp1);
|
|
pfree(cp2);
|
|
|
|
return result;
|
|
|
|
#else /* !USE_LOCALE */
|
|
|
|
PGLZ_DecompState ds1;
|
|
PGLZ_DecompState ds2;
|
|
int c1;
|
|
int c2;
|
|
int32 result = (int32)0;
|
|
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return (int32)0;
|
|
|
|
pglz_decomp_init(&ds1, lz1);
|
|
pglz_decomp_init(&ds2, lz2);
|
|
|
|
for(;;)
|
|
{
|
|
c1 = pglz_decomp_getchar(&ds1);
|
|
c2 = pglz_decomp_getchar(&ds2);
|
|
|
|
if (c1 == EOF)
|
|
{
|
|
if (c2 != EOF)
|
|
result = (int32)-1;
|
|
break;
|
|
} else {
|
|
if (c2 == EOF)
|
|
{
|
|
result = (int32)1;
|
|
}
|
|
}
|
|
if (c1 != c2)
|
|
{
|
|
result = (int32)(c1 - c2);
|
|
break;
|
|
}
|
|
}
|
|
|
|
pglz_decomp_end(&ds1);
|
|
pglz_decomp_end(&ds2);
|
|
|
|
return result;
|
|
|
|
#endif /* USE_LOCALE */
|
|
}
|
|
|
|
|
|
/* ----------
|
|
* lztext_eq ... -
|
|
*
|
|
* =, !=, >, >=, < and <= operator functions for two
|
|
* lztext datums.
|
|
* ----------
|
|
*/
|
|
bool
|
|
lztext_eq(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) == 0);
|
|
}
|
|
|
|
|
|
bool
|
|
lztext_ne(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) != 0);
|
|
}
|
|
|
|
|
|
bool
|
|
lztext_gt(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) > 0);
|
|
}
|
|
|
|
|
|
bool
|
|
lztext_ge(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) >= 0);
|
|
}
|
|
|
|
|
|
bool
|
|
lztext_lt(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) < 0);
|
|
}
|
|
|
|
|
|
bool
|
|
lztext_le(lztext *lz1, lztext *lz2)
|
|
{
|
|
if (lz1 == NULL || lz2 == NULL)
|
|
return false;
|
|
|
|
return (bool)(lztext_cmp(lz1, lz2) <= 0);
|
|
}
|
|
|
|
|