Skip to content
Snippets Groups Projects
Commit c7faf451 authored by Teodor Sigaev's avatar Teodor Sigaev
Browse files

Add more strict check of stop and non-recognized words,

allow only recognized words in thezaurus configuration file.
parent d77df813
No related branches found
No related tags found
No related merge requests found
/* $PostgreSQL: pgsql/contrib/tsearch2/dict_thesaurus.c,v 1.1 2006/05/31 14:05:31 teodor Exp $ */ /* $PostgreSQL: pgsql/contrib/tsearch2/dict_thesaurus.c,v 1.2 2006/06/02 15:35:42 teodor Exp $ */
/* /*
* thesaurus * thesaurus
...@@ -330,8 +330,12 @@ compileTheLexeme(DictThesaurus *d) { ...@@ -330,8 +330,12 @@ compileTheLexeme(DictThesaurus *d) {
); );
if ( !(ptr && ptr->lexeme) ) { if ( !(ptr && ptr->lexeme) ) {
if ( !ptr )
elog(NOTICE,"Thesaurus: word '%s' isn't recognized by subdictionary", d->wrds[i].lexeme);
else
elog(ERROR,"Thesaurus: word '%s' is recognized as stop-word, assign any stop-word", d->wrds[i].lexeme);
newwrds = addCompiledLexeme( newwrds, &nnw, &tnm, NULL, d->wrds[i].entries, 0); newwrds = addCompiledLexeme( newwrds, &nnw, &tnm, NULL, d->wrds[i].entries, 0);
elog(NOTICE,"Thesaurus: word '%s' isn't recognized by subdictionary or it's a stop-word, assign any non-recognized word", d->wrds[i].lexeme);
} else { } else {
while( ptr->lexeme ) { while( ptr->lexeme ) {
TSLexeme *remptr = ptr+1; TSLexeme *remptr = ptr+1;
...@@ -420,7 +424,7 @@ compileTheSubstitute(DictThesaurus *d) { ...@@ -420,7 +424,7 @@ compileTheSubstitute(DictThesaurus *d) {
); );
reml = lexized; reml = lexized;
if ( lexized ) { if ( lexized && lexized->lexeme ) {
int toset = (lexized->lexeme && outptr != d->subst[i].res ) ? (outptr - d->subst[i].res) : -1; int toset = (lexized->lexeme && outptr != d->subst[i].res ) ? (outptr - d->subst[i].res) : -1;
while( lexized->lexeme ) { while( lexized->lexeme ) {
...@@ -443,6 +447,8 @@ compileTheSubstitute(DictThesaurus *d) { ...@@ -443,6 +447,8 @@ compileTheSubstitute(DictThesaurus *d) {
if ( toset > 0) if ( toset > 0)
d->subst[i].res[toset].flags |= TSL_ADDPOS; d->subst[i].res[toset].flags |= TSL_ADDPOS;
} else {
elog(NOTICE,"Thesaurus: word '%s' isn't recognized by subdictionary or it's a stop-word, ignored", inptr->lexeme);
} }
if ( inptr->lexeme ) if ( inptr->lexeme )
...@@ -450,6 +456,9 @@ compileTheSubstitute(DictThesaurus *d) { ...@@ -450,6 +456,9 @@ compileTheSubstitute(DictThesaurus *d) {
inptr++; inptr++;
} }
if ( outptr == d->subst[i].res )
elog(ERROR,"Thesaurus: all words in subsitution aren't recognized by subdictionary");
d->subst[i].reslen = outptr - d->subst[i].res; d->subst[i].reslen = outptr - d->subst[i].res;
free(rem); free(rem);
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment