postgresql/contrib/tsearch/morph.c

/*
 * morphology module
 * New dictionaries are included via dict.h. For languages which
 * use the Latin charset it may be necessary to modify the mapdict table.
 * Teodor Sigaev <teodor@stack.net>
 */
#include "postgres.h"

#include <locale.h>

#include "utils/builtins.h"

#include "morph.h"
#include "deflex.h"

/*
 * Struct for calling dictionaries.
 * All of these methods are optional, but if all of them are NULL
 * the dictionary does nothing :)
 * The return value of lemmatize must be either palloc'ed or the same
 * pointer that was passed in.
 * The return value of init must be malloc'ed; otherwise it will be
 * freed at the end of the transaction!
 *
 * Entries of dicts[] are filled with positional initializers, so the
 * order of the members below must not change.
 */
typedef struct
{
	/* locale name; initmorph() compares it with setlocale(LC_CTYPE, NULL) */
	char		localename[NAMEDATALEN];
	/* init dictionary; the result is stored in dictobjs[] by initmorph() */
	void	   *(*init) (void);
	/* close dictionary (never called from within this file) */
	void		(*close) (void *);
	/*
	 * find in dictionary: receives the dictionary object, the word and a
	 * pointer to its length (which the callee may update)
	 */
	char	   *(*lemmatize) (void *, char *, int *);
	/* nonzero if the word itself is a stop word; checked before lemmatize */
	int			(*is_stoplemm) (void *, char *, int);
	/* nonzero if the lemmatized word is a stop word; checked after lemmatize */
	int			(*is_stemstoplemm) (void *, char *, int);
}	DICT;

/*
 * Insert all dictionaries: dict.h is included with DICT_BODY defined.
 * NOTE(review): presumably this pulls in each dictionary's implementation;
 * confirm against dict.h.
 */
#define DICT_BODY
#include "dict.h"
#undef	DICT_BODY

/*
 * Fill the dictionary table.  Entry 0 is a fake "C" dictionary without any
 * methods; dict.h is included again, this time with DICT_TABLE defined, and
 * whatever it expands to is appended to the initializer list (presumably
 * one ", { ... }" entry per real dictionary -- confirm against dict.h).
 */
#define DICT_TABLE
DICT		dicts[] = {
	{
		"C", NULL, NULL, NULL, NULL, NULL		/* fake dictionary */
	}
#include "dict.h"
};

#undef DICT_TABLE

/*
 * Per-dictionary objects, parallel to dicts[]: slot i holds whatever
 * dicts[i].init returned (filled in by initmorph() when needed).
 */
void	   *dictobjs[lengthof(dicts)];

/*
 * Values that can be stored in a mapdict slot.  Positive values are
 * indexes into dicts[]; the others are markers.  Negative constants are
 * parenthesized so they stay a single operand wherever they are expanded.
 */
#define STOPLEXEM	(-2)		/* lexeme of this type is always a stop word */
#define BYLOCALE	(-1)		/* placeholder for the current locale's dictionary */
#define NODICT		0			/* no dictionary; ends the slot list */
#define DEFAULTDICT 1			/* dicts[1] */

/* number of dictionary slots per lexeme type */
#define MAXNDICT	2
typedef int2 MAPDICT[MAXNDICT];

/*
 * The i-th slot of the MAPDICT that x points to.  The expansion is an
 * lvalue, and is fully parenthesized so it composes safely with any
 * surrounding operator.
 */
#define GETDICT(x,i)	(*( ((int2*)(x)) + (i) ))

/*
 * map dictionaries for lexem type
 *
 * The row index is the lexeme type number passed to lemmatize() and
 * is_stoptype(); each row lists up to MAXNDICT dictionaries to try, in
 * order.  The type names in the row comments presumably correspond to the
 * constants in deflex.h -- confirm there.  Row 0 is not used.
 *
 * The table is not const: initmorph() rewrites it in place, replacing
 * BYLOCALE placeholders and compacting each row.
 */
static MAPDICT mapdict[] = {
	{NODICT, NODICT},			/* not used			*/
	{DEFAULTDICT, NODICT},		/* LATWORD		*/
	{BYLOCALE, NODICT},			/* NONLATINWORD		*/
	{BYLOCALE, DEFAULTDICT},	/* UWORD		*/
	{NODICT, NODICT},			/* EMAIL		*/
	{NODICT, NODICT},			/* FURL			*/
	{NODICT, NODICT},			/* HOST			*/
	{NODICT, NODICT},			/* SCIENTIFIC		*/
	{NODICT, NODICT},			/* VERSIONNUMBER		*/
	{BYLOCALE, DEFAULTDICT},	/* PARTHYPHENWORD		*/
	{BYLOCALE, NODICT},			/* CYRPARTHYPHENWORD */
	{DEFAULTDICT, NODICT},		/* LATPARTHYPHENWORD		*/
	{STOPLEXEM, NODICT},		/* SPACE		*/
	{STOPLEXEM, NODICT},		/* TAG		*/
	{STOPLEXEM, NODICT},		/* HTTP			*/
	{BYLOCALE, DEFAULTDICT},	/* HYPHENWORD		*/
	{DEFAULTDICT, NODICT},		/* LATHYPHENWORD		*/
	{BYLOCALE, NODICT},			/* CYRHYPHENWORD	*/
	{NODICT, NODICT},			/* URI			*/
	{NODICT, NODICT},			/* FILEPATH		*/
	{NODICT, NODICT},			/* DECIMAL		*/
	{NODICT, NODICT},			/* SIGNEDINT		*/
	{NODICT, NODICT},			/* UNSIGNEDINT		*/
	{STOPLEXEM, NODICT}			/* HTMLENTITY		*/
};

static bool inited = false;

void
initmorph(void)
{
	int			i,
				j,
				k;
	MAPDICT    *md;
	bool		needinit[lengthof(dicts)];
	const char *curlocale;
	int			bylocaledict = NODICT;

	if (inited)
		return;
	for (i = 1; i < lengthof(dicts); i++)
		needinit[i] = false;

	curlocale = setlocale(LC_CTYPE, NULL);
	if (curlocale)
	{
		for (i = 1; i < lengthof(dicts); i++)
			if (strcmp(dicts[i].localename, curlocale) == 0)
			{
				bylocaledict = i;
				break;
			}
	}

	for (i = 1; i < lengthof(mapdict); i++)
	{
		k = 0;
		md = &mapdict[i];
		for (j = 0; j < MAXNDICT; j++)
		{
			GETDICT(md, k) = GETDICT(md, j);
			if (GETDICT(md, k) == NODICT)
				break;
			else if (GETDICT(md, k) == BYLOCALE)
			{
				if (bylocaledict == NODICT)
					continue;
				GETDICT(md, k) = bylocaledict;
			}
			if (GETDICT(md, k) >= (int2) lengthof(dicts))
				continue;
			needinit[GETDICT(md, k)] = true;
			k++;
		}
		for (; k < MAXNDICT; k++)
			if (GETDICT(md, k) != STOPLEXEM)
				GETDICT(md, k) = NODICT;
	}

	for (i = 1; i < lengthof(dicts); i++)
		if (needinit[i] && dicts[i].init)
			dictobjs[i] = (*(dicts[i].init)) ();

	inited = true;
	return;
}

/*
 * lemmatize
 *
 * Run a word of lexeme type 'type' through the dictionaries mapped to that
 * type, in order.
 *
 *	word - the word to process
 *	len  - in/out: length of the word; a dictionary may update it
 *	type - lexeme type, used as the row index into mapdict
 *
 * Returns NULL if the word is a stop word; the result of the first
 * dictionary that recognizes the word (a different pointer, or the same
 * pointer with a changed *len); otherwise 'word' itself.  A type outside
 * mapdict is treated as having no dictionary and yields 'word'.
 */
char *
lemmatize(char *word, int *len, int type)
{
	int2		nd;
	int			i;
	DICT	   *dict;

	/* never index mapdict with a type it has no row for */
	if (type < 0 || type >= (int) lengthof(mapdict))
		return word;

	for (i = 0; i < MAXNDICT; i++)
	{
		nd = GETDICT(&mapdict[type], i);
		if (nd == NODICT)
		{
			/* there is no dictionary */
			return word;
		}
		else if (nd == STOPLEXEM)
		{
			/* word is stopword */
			return NULL;
		}
		else if (nd == BYLOCALE)
		{
			/*
			 * Unresolved placeholder: it must not be used as an index
			 * into dicts[], so try the next slot.
			 */
			continue;			/* no dict for current locale */
		}
		else
		{
			dict = &dicts[nd];
			if (dict->is_stoplemm && (*(dict->is_stoplemm)) (dictobjs[nd], word, *len))
				return NULL;
			if (dict->lemmatize)
			{
				int			oldlen = *len;
				char	   *newword = (*(dict->lemmatize)) (dictobjs[nd], word, len);

				/* word is recognized by dictionary */
				if (newword != word || *len != oldlen)
				{
					/*
					 * NOTE(review): the check below is given 'word' with
					 * the updated *len, not 'newword'.  That is the same
					 * thing when the dictionary works in place; confirm
					 * it is intended when a new string is returned.
					 */
					if (dict->is_stemstoplemm &&
					(*(dict->is_stemstoplemm)) (dictobjs[nd], word, *len))
					{
						/* free only a result distinct from the input */
						if (newword != word && newword)
							pfree(newword);
						return NULL;
					}
					return newword;
				}
			}
		}
	}

	return word;
}

/*
 * is_stoptype
 *
 * Returns true if the first mapdict slot for lexeme type 'type' is
 * STOPLEXEM, i.e. every lexeme of that type is a stop word.  A type
 * outside mapdict has no mapping and is reported as not a stop type.
 */
bool
is_stoptype(int type)
{
	/* never index mapdict with a type it has no row for */
	if (type < 0 || type >= (int) lengthof(mapdict))
		return false;

	return GETDICT(&mapdict[type], 0) == STOPLEXEM;
}
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`/*`
			`* morphology module`
			`* New dictionary is include in dict.h. For languages which`
			`* use latin charset it may be need to modify mapdict table.`
			`* Teodor Sigaev <teodor@stack.net>`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`*/`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#include "postgres.h"`

Fix compile errors. 2002-09-06 04:51:39 +08:00			`#include <locale.h>`

txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#include "utils/builtins.h"`

			`#include "morph.h"`
			`#include "deflex.h"`

			`/*`
			`* Struct for calling dictionaries`
			`* All of this methods are optional, but`
			`* if all methods are NULL, then dictionary does nothing :)`
			`* Return value of lemmatize must be palloced or the same.`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`* Return value of init must be malloced in other case`
			`* it will be free in end of transaction!`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`*/`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`typedef struct`
			`{`
Fix compile errors. 2002-09-06 04:51:39 +08:00			`char localename[NAMEDATALEN];`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`/* init dictionary */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`void (init) (void);`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`/* close dictionary */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`void (close) (void );`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`/* find in dictionary */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`char (lemmatize) (void , char , int *);`
			`int (is_stoplemm) (void , char *, int);`
			`int (is_stemstoplemm) (void , char *, int);`
New pgindent run with fixes suggested by Tom. Patch manually reviewed, initdb/regression tests pass. 2001-11-06 01:46:40 +08:00			`} DICT;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
			`/* insert all dictionaries */`
			`#define DICT_BODY`
			`#include "dict.h"`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`#undef DICT_BODY`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`/* fill dictionary's structure */`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#define DICT_TABLE`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`DICT dicts[] = {`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`{`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`"C", NULL, NULL, NULL, NULL, NULL /* fake dictionary */`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`}`
			`#include "dict.h"`
			`};`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#undef DICT_TABLE`

Fix compile errors. 2002-09-06 04:51:39 +08:00			`/* array for storing dictionary's objects (if needed) */`
pgindent run. 2003-08-04 08:43:34 +08:00			`void *dictobjs[`
			`lengthof(dicts)];`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
			`#define STOPLEXEM -2`
			`#define BYLOCALE -1`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`#define NODICT 0`
			`#define DEFAULTDICT 1`

txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#define MAXNDICT 2`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`typedef int2 MAPDICT[MAXNDICT];`

txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`#define GETDICT(x,i) ( ((int2)(x)) + (i) )`

			`/* map dictionaries for lexem type */`
			`static MAPDICT mapdict[] = {`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`{NODICT, NODICT}, /* not used */`
			`{DEFAULTDICT, NODICT}, /* LATWORD */`
			`{BYLOCALE, NODICT}, /* NONLATINWORD */`
			`{BYLOCALE, DEFAULTDICT}, /* UWORD */`
			`{NODICT, NODICT}, /* EMAIL */`
			`{NODICT, NODICT}, /* FURL */`
			`{NODICT, NODICT}, /* HOST */`
August 13, 2002 Use parser of OpenFTS v0.33. -- Teodor Sigaev 2002-08-15 11:02:08 +08:00			`{NODICT, NODICT}, /* SCIENTIFIC */`
			`{NODICT, NODICT}, /* VERSIONNUMBER */`
			`{BYLOCALE, DEFAULTDICT}, /* PARTHYPHENWORD */`
			`{BYLOCALE, NODICT}, /* CYRPARTHYPHENWORD */`
			`{DEFAULTDICT, NODICT}, /* LATPARTHYPHENWORD */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`{STOPLEXEM, NODICT}, /* SPACE */`
August 13, 2002 Use parser of OpenFTS v0.33. -- Teodor Sigaev 2002-08-15 11:02:08 +08:00			`{STOPLEXEM, NODICT}, /* TAG */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`{STOPLEXEM, NODICT}, /* HTTP */`
August 13, 2002 Use parser of OpenFTS v0.33. -- Teodor Sigaev 2002-08-15 11:02:08 +08:00			`{BYLOCALE, DEFAULTDICT}, /* HYPHENWORD */`
			`{DEFAULTDICT, NODICT}, /* LATHYPHENWORD */`
			`{BYLOCALE, NODICT}, /* CYRHYPHENWORD */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`{NODICT, NODICT}, /* URI */`
August 13, 2002 Use parser of OpenFTS v0.33. -- Teodor Sigaev 2002-08-15 11:02:08 +08:00			`{NODICT, NODICT}, /* FILEPATH */`
			`{NODICT, NODICT}, /* DECIMAL */`
			`{NODICT, NODICT}, /* SIGNEDINT */`
			`{NODICT, NODICT}, /* UNSIGNEDINT */`
			`{STOPLEXEM, NODICT} /* HTMLENTITY */`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`};`

pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`static bool inited = false;`

			`void`
			`initmorph(void)`
			`{`
			`int i,`
			`j,`
			`k;`
			`MAPDICT *md;`
			`bool needinit[lengthof(dicts)];`
Fix compile errors. 2002-09-06 04:51:39 +08:00			`const char *curlocale;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`int bylocaledict = NODICT;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`if (inited)`
			`return;`
			`for (i = 1; i < lengthof(dicts); i++)`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`needinit[i] = false;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00
Fix compile errors. 2002-09-06 04:51:39 +08:00			`curlocale = setlocale(LC_CTYPE, NULL);`
			`if (curlocale)`
			`{`
Pleas apply it for 7.2.1 and current CVS. Patch fixes using lc.lang instead of lc.lc_ctype. Teodor Sigaev 2002-03-12 00:54:27 +08:00			`for (i = 1; i < lengthof(dicts); i++)`
Fix compile errors. 2002-09-06 04:51:39 +08:00			`if (strcmp(dicts[i].localename, curlocale) == 0)`
Pleas apply it for 7.2.1 and current CVS. Patch fixes using lc.lang instead of lc.lc_ctype. Teodor Sigaev 2002-03-12 00:54:27 +08:00			`{`
			`bylocaledict = i;`
			`break;`
			`}`
Fix compile errors. 2002-09-06 04:51:39 +08:00			`}`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`for (i = 1; i < lengthof(mapdict); i++)`
			`{`
			`k = 0;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`md = &mapdict[i];`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`for (j = 0; j < MAXNDICT; j++)`
			`{`
			`GETDICT(md, k) = GETDICT(md, j);`
			`if (GETDICT(md, k) == NODICT)`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`break;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`else if (GETDICT(md, k) == BYLOCALE)`
			`{`
			`if (bylocaledict == NODICT)`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`continue;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`GETDICT(md, k) = bylocaledict;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`}`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`if (GETDICT(md, k) >= (int2) lengthof(dicts))`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`continue;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`needinit[GETDICT(md, k)] = true;`
			`k++;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`}`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`for (; k < MAXNDICT; k++)`
			`if (GETDICT(md, k) != STOPLEXEM)`
			`GETDICT(md, k) = NODICT;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`}`

pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`for (i = 1; i < lengthof(dicts); i++)`
			`if (needinit[i] && dicts[i].init)`
			`dictobjs[i] = (*(dicts[i].init)) ();`

txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`inited = true;`
			`return;`
			`}`

pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`char *`
			`lemmatize(char word, int len, int type)`
			`{`
			`int2 nd;`
			`int i;`
			`DICT *dict;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`for (i = 0; i < MAXNDICT; i++)`
			`{`
			`nd = GETDICT(&mapdict[type], i);`
			`if (nd == NODICT)`
			`{`
			`/* there is no dictionary */`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`return word;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`}`
			`else if (nd == STOPLEXEM)`
			`{`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`/* word is stopword */`
			`return NULL;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`}`
Thank you very much, you catch it :). This bug had a long life, because it exists if and only if locale of postmaster was a different from C (or ru_RU.KOI8-R). Please, apply patch for current CVS & 7.3.1 Magnus Naeslund(f) wrote: > Ok, I nailed the bug, but i'm not sure what the correct fix is. > Attached tsearch_morph.diff that remedies this problem by avoiding it. > Also there's a debug aid patch if someone would like to know how i > finally found it out :) > > There problem in the lemmatize() function is that GETDICT(...) returned > a value not handled (BYLOCALE). > The value (-1) and later used as an index into the dicts[] array. > After that everything went berserk stack went crazy somehow so trapping > the fault sent me to the wrong place, and every time i read the value it > was positive ;) > > So now i just return the initial word passed to the lemmatize function, > because i don't know what to do with it. Magnus Naeslund 2002-12-06 13:15:02 +08:00			`else if (nd == BYLOCALE)`
			`{`
pgindent run. 2003-08-04 08:43:34 +08:00			`continue; /* no dict for current locale */`
Thank you very much, you catch it :). This bug had a long life, because it exists if and only if locale of postmaster was a different from C (or ru_RU.KOI8-R). Please, apply patch for current CVS & 7.3.1 Magnus Naeslund(f) wrote: > Ok, I nailed the bug, but i'm not sure what the correct fix is. > Attached tsearch_morph.diff that remedies this problem by avoiding it. > Also there's a debug aid patch if someone would like to know how i > finally found it out :) > > There problem in the lemmatize() function is that GETDICT(...) returned > a value not handled (BYLOCALE). > The value (-1) and later used as an index into the dicts[] array. > After that everything went berserk stack went crazy somehow so trapping > the fault sent me to the wrong place, and every time i read the value it > was positive ;) > > So now i just return the initial word passed to the lemmatize function, > because i don't know what to do with it. Magnus Naeslund 2002-12-06 13:15:02 +08:00			`}`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`else`
			`{`
			`dict = &dicts[nd];`
			`if (dict->is_stoplemm && ((dict->is_stoplemm)) (dictobjs[nd], word, len))`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`return NULL;`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`if (dict->lemmatize)`
			`{`
			`int oldlen = *len;`
			`char newword = ((dict->lemmatize)) (dictobjs[nd], word, len);`

This patch fixes a bunch of spelling mistakes in comments throughout the PostgreSQL source code. Neil Conway 2003-03-11 06:28:22 +08:00			`/* word is recognized by dictionary */`
pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`if (newword != word \|\| *len != oldlen)`
			`{`
			`if (dict->is_stemstoplemm &&`
			`((dict->is_stemstoplemm)) (dictobjs[nd], word, len))`
			`{`
			`if (newword != word && newword)`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`pfree(newword);`
			`return NULL;`
			`}`
			`return newword;`
			`}`
			`}`
			`}`
			`}`

			`return word;`
			`}`

pgindent run on all C files. Java run to follow. initdb/regression tests pass. 2001-10-25 13:50:21 +08:00			`bool`
			`is_stoptype(int type)`
			`{`
			`return (GETDICT(&mapdict[type], 0) == STOPLEXEM) ? true : false;`
txtidx datatype for full text indexing with GiST. From Oleg Bartunov and Teodor Sigaev. 2001-10-13 07:19:09 +08:00			`}`