postgresql/contrib/tsearch2/stopword.c

119 lines
2.1 KiB
C
Raw Normal View History

2003-08-04 02:43:34 +02:00
/*
2003-07-21 12:27:44 +02:00
* stopword library
* Teodor Sigaev <teodor@sigaev.ru>
*/
#include "postgres.h"
2003-07-21 12:27:44 +02:00
#include "common.h"
#include "dict.h"
#include "ts_locale.h"
2003-07-21 12:27:44 +02:00
#define STOPBUFLEN 4096
void
2003-08-04 02:43:34 +02:00
freestoplist(StopList * s)
{
char **ptr = s->stop;
if (ptr)
while (*ptr && s->len > 0)
{
2003-07-21 12:27:44 +02:00
free(*ptr);
2003-08-04 02:43:34 +02:00
ptr++;
s->len--;
free(s->stop);
}
memset(s, 0, sizeof(StopList));
2003-07-21 12:27:44 +02:00
}
void
2003-08-04 02:43:34 +02:00
readstoplist(text *in, StopList * s)
{
char **stop = NULL;
s->len = 0;
if (in && VARSIZE(in) - VARHDRSZ > 0)
{
char *filename = to_absfilename(text2char(in));
FILE *hin;
char buf[STOPBUFLEN], *pbuf;
2003-08-04 02:43:34 +02:00
int reallen = 0;
if ((hin = fopen(filename, "r")) == NULL)
ereport(ERROR,
(errcode(ERRCODE_CONFIG_FILE_ERROR),
errmsg("could not open file \"%s\": %m",
2003-08-04 02:43:34 +02:00
filename)));
while (fgets(buf, sizeof(buf), hin))
2003-08-04 02:43:34 +02:00
{
pbuf = buf;
while( *pbuf && !isspace((unsigned char) *pbuf ) )
pbuf++;
*pbuf = '\0';
2006-10-04 02:30:14 +02:00
pg_verifymbstr(buf, strlen(buf), false);
if (*buf == '\0' || *buf=='\n' || *buf=='\r')
2003-08-04 02:43:34 +02:00
continue;
2003-07-21 12:27:44 +02:00
2003-08-04 02:43:34 +02:00
if (s->len >= reallen)
{
char **tmp;
reallen = (reallen) ? reallen * 2 : 16;
tmp = (char **) realloc((void *) stop, sizeof(char *) * reallen);
if (!tmp)
{
2003-07-21 12:27:44 +02:00
freestoplist(s);
2003-08-04 02:43:34 +02:00
fclose(hin);
ereport(ERROR,
(errcode(ERRCODE_OUT_OF_MEMORY),
errmsg("out of memory")));
2003-07-21 12:27:44 +02:00
}
2003-08-04 02:43:34 +02:00
stop = tmp;
2003-07-21 12:27:44 +02:00
}
2003-08-04 02:43:34 +02:00
if (s->wordop)
{
pbuf = s->wordop(buf);
stop[s->len] = strdup(pbuf);
pfree(pbuf);
} else
stop[s->len] = strdup(buf);
2003-08-04 02:43:34 +02:00
if (!stop[s->len])
{
2003-07-21 12:27:44 +02:00
freestoplist(s);
2003-08-04 02:43:34 +02:00
fclose(hin);
ereport(ERROR,
(errcode(ERRCODE_OUT_OF_MEMORY),
errmsg("out of memory")));
2003-07-21 12:27:44 +02:00
}
2003-08-04 02:43:34 +02:00
(s->len)++;
2003-07-21 12:27:44 +02:00
}
fclose(hin);
2003-08-04 02:43:34 +02:00
pfree(filename);
2003-07-21 12:27:44 +02:00
}
2003-08-04 02:43:34 +02:00
s->stop = stop;
}
2003-07-21 12:27:44 +02:00
static int
2003-08-04 02:43:34 +02:00
comparestr(const void *a, const void *b)
{
return strcmp(*(char **) a, *(char **) b);
2003-07-21 12:27:44 +02:00
}
void
2003-08-04 02:43:34 +02:00
sortstoplist(StopList * s)
{
if (s->stop && s->len > 0)
qsort(s->stop, s->len, sizeof(char *), comparestr);
2003-07-21 12:27:44 +02:00
}
bool
2003-08-04 02:43:34 +02:00
searchstoplist(StopList * s, char *key)
{
return (s->stop && s->len > 0 && bsearch(&key, s->stop, s->len, sizeof(char *), comparestr)) ? true : false;
2003-07-21 12:27:44 +02:00
}