mirror of
https://github.com/sqlite/sqlite.git
synced 2025-07-30 19:03:16 +03:00
Bug fix in the FTS1 snippet generator. Improvements in the way the snippet
generator handles whitespace. (CVS 3448) FossilOrigin-Name: d3f4ae827582bd0aac54ae3211d272a1429b6523
This commit is contained in:
@ -2298,6 +2298,27 @@ static int wordBoundary(
|
||||
return iBreak;
|
||||
}
|
||||
|
||||
/*
|
||||
** If the StringBuffer does not end in white space, add a single
|
||||
** space character to the end.
|
||||
*/
|
||||
static void appendWhiteSpace(StringBuffer *p){
|
||||
if( p->len==0 ) return;
|
||||
if( isspace(p->s[p->len-1]) ) return;
|
||||
append(p, " ");
|
||||
}
|
||||
|
||||
/*
|
||||
** Remove white space from teh end of the StringBuffer
|
||||
*/
|
||||
static void trimWhiteSpace(StringBuffer *p){
|
||||
while( p->len>0 && isspace(p->s[p->len-1]) ){
|
||||
p->len--;
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
|
||||
/*
|
||||
** Allowed values for Snippet.aMatch[].snStatus
|
||||
*/
|
||||
@ -2369,8 +2390,12 @@ static void snippetText(
|
||||
wantEllipsis = 0;
|
||||
tailEllipsis = 0;
|
||||
}
|
||||
if( iCol!=tailCol || iStart!=tailOffset ){
|
||||
appendWhiteSpace(&sb);
|
||||
}
|
||||
if( wantEllipsis || tailEllipsis ){
|
||||
append(&sb, zEllipsis);
|
||||
appendWhiteSpace(&sb);
|
||||
}
|
||||
iEnd = aMatch[i].iStart + aMatch[i].nByte + 40;
|
||||
iEnd = wordBoundary(iEnd, zDoc, nDoc, aMatch, nMatch, iCol);
|
||||
@ -2382,8 +2407,12 @@ static void snippetText(
|
||||
}
|
||||
while( iMatch<nMatch && aMatch[iMatch].iCol<iCol ){ iMatch++; }
|
||||
while( iStart<iEnd ){
|
||||
while( iMatch<nMatch && aMatch[iMatch].iStart<iStart ){ iMatch++; }
|
||||
if( iMatch<nMatch && aMatch[iMatch].iStart<iEnd ){
|
||||
while( iMatch<nMatch && aMatch[iMatch].iStart<iStart
|
||||
&& aMatch[iMatch].iCol<=iCol ){
|
||||
iMatch++;
|
||||
}
|
||||
if( iMatch<nMatch && aMatch[iMatch].iStart<iEnd
|
||||
&& aMatch[iMatch].iCol==iCol ){
|
||||
nappend(&sb, &zDoc[iStart], aMatch[iMatch].iStart - iStart);
|
||||
iStart = aMatch[iMatch].iStart;
|
||||
append(&sb, zStartMark);
|
||||
@ -2405,7 +2434,9 @@ static void snippetText(
|
||||
tailCol = iCol;
|
||||
tailOffset = iEnd;
|
||||
}
|
||||
trimWhiteSpace(&sb);
|
||||
if( tailEllipsis ){
|
||||
appendWhiteSpace(&sb);
|
||||
append(&sb, zEllipsis);
|
||||
}
|
||||
pCursor->snippet.zSnippet = sb.s;
|
||||
|
14
manifest
14
manifest
@ -1,5 +1,5 @@
|
||||
C Avoid\ssegfaults\swhen\sinserted\sNULL\svalues\sinto\sFTS1.\s(CVS\s3447)
|
||||
D 2006-09-28T11:41:41
|
||||
C Bug\sfix\sin\sthe\sFTS1\ssnippet\sgenerator.\s\sImprovements\sin\sthe\sway\sthe\ssnippet\ngenerator\shandles\swhitespace.\s(CVS\s3448)
|
||||
D 2006-09-28T18:37:16
|
||||
F Makefile.in cabd42d34340f49260bc2a7668c38eba8d4cfd99
|
||||
F Makefile.linux-gcc 2d8574d1ba75f129aba2019f0b959db380a90935
|
||||
F README 9c4e2d6706bdcc3efdd773ce752a8cdab4f90028
|
||||
@ -21,7 +21,7 @@ F ext/README.txt 913a7bd3f4837ab14d7e063304181787658b14e1
|
||||
F ext/fts1/README.txt 20ac73b006a70bcfd80069bdaf59214b6cf1db5e
|
||||
F ext/fts1/ft_hash.c 3927bd880e65329bdc6f506555b228b28924921b
|
||||
F ext/fts1/ft_hash.h 1a35e654a235c2c662d3ca0dfc3138ad60b8b7d5
|
||||
F ext/fts1/fts1.c 5cb7829d331502a3151d6648cadd358ac97b5161
|
||||
F ext/fts1/fts1.c 8531a2a86cc9a29d0b47762243e04f8e45655d33
|
||||
F ext/fts1/fts1.h 6060b8f62c1d925ea8356cb1a6598073eb9159a6
|
||||
F ext/fts1/fts1_hash.c 3196cee866edbebb1c0521e21672e6d599965114
|
||||
F ext/fts1/fts1_hash.h 957d378355ed29f672cd5add012ce8b088a5e089
|
||||
@ -192,7 +192,7 @@ F test/fkey1.test 153004438d51e6769fb1ce165f6313972d6263ce
|
||||
F test/format4.test bf3bed3b13c63abfb3cfec232597a319a31d0bcc
|
||||
F test/fts1a.test 8fa66282a2a297faebdab76279c1693eb7920a3b
|
||||
F test/fts1b.test 5d8a01aefbecc8b7442b36c94c05eb7a845462d5
|
||||
F test/fts1c.test a57cb192d59ddacba64d17c326ff99393c181dc6
|
||||
F test/fts1c.test 3e1ad5a8b9118ba2970e6e4572cbc0f0d952d184
|
||||
F test/func.test 0ed54b5aeaad319f68016c033acfebef56f5874a
|
||||
F test/hook.test 7e7645fd9a033f79cce8fdff151e32715e7ec50a
|
||||
F test/in.test 369cb2aa1eab02296b4ec470732fe8c131260b1d
|
||||
@ -399,7 +399,7 @@ F www/tclsqlite.tcl bb0d1357328a42b1993d78573e587c6dcbc964b9
|
||||
F www/vdbe.tcl 87a31ace769f20d3627a64fa1fade7fed47b90d0
|
||||
F www/version3.tcl 890248cf7b70e60c383b0e84d77d5132b3ead42b
|
||||
F www/whentouse.tcl 97e2b5cd296f7d8057e11f44427dea8a4c2db513
|
||||
P 944d5f812004e2dc0065fce267accf8907235a50
|
||||
R a3b9f1ec905300375312507d7a2e50ec
|
||||
P 165645d30115f3171fc45489823f85639fe2bfcd
|
||||
R 02e1bfc3de0db0fdbc150a5e5d77d065
|
||||
U drh
|
||||
Z e44db4ed3c8a0588eb2a24973c8a730d
|
||||
Z 838ab44cedca04109db513f0d883f765
|
||||
|
@ -1 +1 @@
|
||||
165645d30115f3171fc45489823f85639fe2bfcd
|
||||
d3f4ae827582bd0aac54ae3211d272a1429b6523
|
@ -11,7 +11,7 @@
|
||||
# This file implements regression tests for SQLite library. The
|
||||
# focus of this script is testing the FTS1 module.
|
||||
#
|
||||
# $Id: fts1c.test,v 1.7 2006/09/21 02:03:11 drh Exp $
|
||||
# $Id: fts1c.test,v 1.8 2006/09/28 18:37:16 drh Exp $
|
||||
#
|
||||
|
||||
set testdir [file dirname $argv0]
|
||||
@ -1131,22 +1131,18 @@ do_test fts1c-4.2 {
|
||||
SELECT snippet(email) FROM email
|
||||
WHERE email MATCH 'christmas candlelight'
|
||||
}
|
||||
} {{<b>...</b>place.? What do you think about going here <b>Christmas</b>
|
||||
} {{<b>...</b> place.? What do you think about going here <b>Christmas</b>
|
||||
eve?? They have an 11:00 a.m. service and a <b>candlelight</b> service at 5:00 p.m.,
|
||||
among others.
|
||||
|
||||
<b>...</b>}}
|
||||
among others. <b>...</b>}}
|
||||
|
||||
do_test fts1c-4.3 {
|
||||
execsql {
|
||||
SELECT snippet(email) FROM email
|
||||
WHERE email MATCH 'deal sheet potential reuse'
|
||||
}
|
||||
} {{EOL-Accenture <b>Deal</b> <b>Sheet</b><b>...</b>intent
|
||||
} {{EOL-Accenture <b>Deal</b> <b>Sheet</b> <b>...</b> intent
|
||||
Review Enron asset base for <b>potential</b> <b>reuse</b>/ licensing
|
||||
Contract negotiations
|
||||
|
||||
<b>...</b>}}
|
||||
Contract negotiations <b>...</b>}}
|
||||
do_test fts1c-4.4 {
|
||||
execsql {
|
||||
SELECT snippet(email,'<<<','>>>',' ') FROM email
|
||||
@ -1154,8 +1150,12 @@ do_test fts1c-4.4 {
|
||||
}
|
||||
} {{EOL-Accenture <<<Deal>>> <<<Sheet>>> intent
|
||||
Review Enron asset base for <<<potential>>> <<<reuse>>>/ licensing
|
||||
Contract negotiations
|
||||
|
||||
}}
|
||||
Contract negotiations }}
|
||||
do_test fts1c-4.5 {
|
||||
execsql {
|
||||
SELECT snippet(email,'<<<','>>>',' ') FROM email
|
||||
WHERE email MATCH 'first things'
|
||||
}
|
||||
} {{Re: <<<First>>> Polish Deal! Congrats! <<<Things>>> seem to be building rapidly now on the }}
|
||||
|
||||
finish_test
|
||||
|
Reference in New Issue
Block a user