2004-06-23 19:06:11 +08:00
|
|
|
#include "regis.h"
|
2005-12-21 21:05:49 +08:00
|
|
|
#include "ts_locale.h"
|
2004-06-23 19:06:11 +08:00
|
|
|
#include "common.h"
|
|
|
|
|
2005-12-21 21:05:49 +08:00
|
|
|
/*
 * RS_isRegis
 *		Cheap syntactic pre-check: does str consist solely of characters
 *		that may appear in a regis pattern?
 *
 * Every (possibly multibyte) character must either satisfy t_isalpha() or
 * be one of '[', ']' and '^'.  Only the alphabet is checked here; bracket
 * balancing is not.
 *
 * Returns true for a NULL or empty string, since no offending character
 * is found in either case.
 */
bool
RS_isRegis(const char *str)
{
	const char *cur;

	if (str == NULL)
		return true;

	/* Step one whole character at a time, as measured by pg_mblen(). */
	for (cur = str; *cur; cur += pg_mblen(cur))
	{
		if (!(t_isalpha(cur) ||
			  t_iseq(cur, '[') ||
			  t_iseq(cur, ']') ||
			  t_iseq(cur, '^')))
			return false;
	}

	return true;
}
|
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
/*
 * Parser states used by RS_compile() while scanning a pattern.
 */
/* just consumed '[': expecting '^' or the first letter of the set */
#define RS_IN_ONEOF		1
/* inside "[...]" after its first letter: expecting more letters or ']' */
#define RS_IN_ONEOF_IN	2
/* inside "[^...]": expecting letters or ']' */
#define RS_IN_NONEOF	3
/* outside any brackets: expecting a plain letter or '[' */
#define RS_IN_WAIT		4
|
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
/*
 * newRegisNode
 *		Allocate a zero-filled RegisNode and optionally chain it after prev.
 *
 * prev: node to link the new one behind (its ->next is overwritten), or
 *		 NULL when no linking is wanted.
 * len:	 payload size in bytes; RNHDRSZ + len + 1 bytes are allocated.
 *
 * Returns the new node.  The memory comes from malloc(), so it has to be
 * released with free() (see RS_free).  Allocation failure is reported via
 * ts_error(ERROR, ...), which is presumably not expected to return.
 */
static RegisNode *
newRegisNode(RegisNode * prev, int len)
{
	size_t		nbytes = RNHDRSZ + len + 1;
	RegisNode  *node = (RegisNode *) malloc(nbytes);

	if (node == NULL)
		ts_error(ERROR, "No memory");
	memset(node, 0, nbytes);

	if (prev != NULL)
		prev->next = node;

	return node;
}
|
|
|
|
|
2005-12-21 21:05:49 +08:00
|
|
|
void
|
|
|
|
RS_compile(Regis * r, bool issuffix, char *str)
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
int len = strlen(str);
|
2004-08-29 13:07:03 +08:00
|
|
|
int state = RS_IN_WAIT;
|
2006-10-04 08:30:14 +08:00
|
|
|
char *c = (char *) str;
|
2004-08-29 13:07:03 +08:00
|
|
|
RegisNode *ptr = NULL;
|
|
|
|
|
|
|
|
memset(r, 0, sizeof(Regis));
|
2004-06-23 19:06:11 +08:00
|
|
|
r->issuffix = (issuffix) ? 1 : 0;
|
|
|
|
|
2006-10-04 08:30:14 +08:00
|
|
|
while (*c)
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
|
|
|
if (state == RS_IN_WAIT)
|
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
if (t_isalpha(c))
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
|
|
|
if (ptr)
|
|
|
|
ptr = newRegisNode(ptr, len);
|
2004-06-23 19:06:11 +08:00
|
|
|
else
|
2004-08-29 13:07:03 +08:00
|
|
|
ptr = r->node = newRegisNode(NULL, len);
|
2005-12-21 21:05:49 +08:00
|
|
|
COPYCHAR(ptr->data, c);
|
2004-06-23 19:06:11 +08:00
|
|
|
ptr->type = RSF_ONEOF;
|
2005-12-21 21:05:49 +08:00
|
|
|
ptr->len = pg_mblen(c);
|
2004-08-29 13:07:03 +08:00
|
|
|
}
|
2006-10-04 08:30:14 +08:00
|
|
|
else if (t_iseq(c, '['))
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
|
|
|
if (ptr)
|
|
|
|
ptr = newRegisNode(ptr, len);
|
2004-06-23 19:06:11 +08:00
|
|
|
else
|
2004-08-29 13:07:03 +08:00
|
|
|
ptr = r->node = newRegisNode(NULL, len);
|
2004-06-23 19:06:11 +08:00
|
|
|
ptr->type = RSF_ONEOF;
|
2004-08-29 13:07:03 +08:00
|
|
|
state = RS_IN_ONEOF;
|
|
|
|
}
|
|
|
|
else
|
2006-10-04 08:30:14 +08:00
|
|
|
ts_error(ERROR, "Error in regis: %s", str);
|
2004-08-29 13:07:03 +08:00
|
|
|
}
|
|
|
|
else if (state == RS_IN_ONEOF)
|
|
|
|
{
|
2006-10-04 08:30:14 +08:00
|
|
|
if (t_iseq(c, '^'))
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
2004-06-23 19:06:11 +08:00
|
|
|
ptr->type = RSF_NONEOF;
|
2004-08-29 13:07:03 +08:00
|
|
|
state = RS_IN_NONEOF;
|
|
|
|
}
|
2005-12-21 21:05:49 +08:00
|
|
|
else if (t_isalpha(c))
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
COPYCHAR(ptr->data, c);
|
|
|
|
ptr->len = pg_mblen(c);
|
2004-08-29 13:07:03 +08:00
|
|
|
state = RS_IN_ONEOF_IN;
|
|
|
|
}
|
|
|
|
else
|
2005-12-21 21:05:49 +08:00
|
|
|
ts_error(ERROR, "Error in regis: %s", str);
|
2004-08-29 13:07:03 +08:00
|
|
|
}
|
|
|
|
else if (state == RS_IN_ONEOF_IN || state == RS_IN_NONEOF)
|
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
if (t_isalpha(c))
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
2006-10-04 08:30:14 +08:00
|
|
|
COPYCHAR(ptr->data + ptr->len, c);
|
|
|
|
ptr->len += pg_mblen(c);
|
2004-08-29 13:07:03 +08:00
|
|
|
}
|
2006-10-04 08:30:14 +08:00
|
|
|
else if (t_iseq(c, ']'))
|
2004-08-29 13:07:03 +08:00
|
|
|
state = RS_IN_WAIT;
|
|
|
|
else
|
2005-12-21 21:05:49 +08:00
|
|
|
ts_error(ERROR, "Error in regis: %s", str);
|
2004-08-29 13:07:03 +08:00
|
|
|
}
|
|
|
|
else
|
2005-12-21 21:05:49 +08:00
|
|
|
ts_error(ERROR, "Internal error in RS_compile: %d", state);
|
|
|
|
c += pg_mblen(c);
|
2004-06-23 19:06:11 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
ptr = r->node;
|
2004-08-29 13:07:03 +08:00
|
|
|
while (ptr)
|
|
|
|
{
|
2004-06-23 19:06:11 +08:00
|
|
|
r->nchar++;
|
2004-08-29 13:07:03 +08:00
|
|
|
ptr = ptr->next;
|
2004-06-23 19:06:11 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
void
|
|
|
|
RS_free(Regis * r)
|
|
|
|
{
|
|
|
|
RegisNode *ptr = r->node,
|
|
|
|
*tmp;
|
2004-06-23 19:06:11 +08:00
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
while (ptr)
|
|
|
|
{
|
|
|
|
tmp = ptr->next;
|
2004-06-23 19:06:11 +08:00
|
|
|
free(ptr);
|
|
|
|
ptr = tmp;
|
|
|
|
}
|
|
|
|
|
|
|
|
r->node = NULL;
|
|
|
|
}
|
|
|
|
|
2005-12-21 21:05:49 +08:00
|
|
|
#ifdef TS_USE_WIDE
/*
 * mb_strchr
 *		Multibyte-aware membership test: does the character that starts at c
 *		occur anywhere in the string str?
 *
 * Both arguments are walked in units of pg_mblen().  Two characters are
 * equal when they have the same byte length and identical bytes.
 * Returns true on the first match, false if str is exhausted.
 */
static bool
mb_strchr(char *str, char *c)
{
	int			want = pg_mblen(c);
	int			curlen;
	char	   *cur;

	for (cur = str; *cur; cur += curlen)
	{
		int			k;

		curlen = pg_mblen(cur);
		if (curlen != want)
			continue;			/* different width, cannot be equal */

		/* compare byte by byte; k reaches want only if all bytes agree */
		for (k = 0; k < want && cur[k] == c[k]; k++)
			;
		if (k == want)
			return true;
	}

	return false;
}
#else
/* Single-byte build: only the first byte of c is looked up in s. */
#define mb_strchr(s,c)	( strchr((s), *(c)) != NULL )
#endif
|
|
|
|
|
|
|
|
|
|
|
|
bool
|
|
|
|
RS_execute(Regis * r, char *str)
|
2004-08-29 13:07:03 +08:00
|
|
|
{
|
|
|
|
RegisNode *ptr = r->node;
|
2006-10-04 08:30:14 +08:00
|
|
|
char *c = str;
|
|
|
|
int len = 0;
|
2004-06-23 19:06:11 +08:00
|
|
|
|
2006-10-04 08:30:14 +08:00
|
|
|
while (*c)
|
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
len++;
|
|
|
|
c += pg_mblen(c);
|
2006-10-04 08:30:14 +08:00
|
|
|
}
|
2004-06-23 19:06:11 +08:00
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
if (len < r->nchar)
|
2006-11-22 02:31:28 +08:00
|
|
|
return false;
|
2004-06-23 19:06:11 +08:00
|
|
|
|
2005-12-21 21:05:49 +08:00
|
|
|
c = str;
|
2006-10-04 08:30:14 +08:00
|
|
|
if (r->issuffix)
|
|
|
|
{
|
2005-12-21 21:05:49 +08:00
|
|
|
len -= r->nchar;
|
2006-10-04 08:30:14 +08:00
|
|
|
while (len-- > 0)
|
2005-12-21 21:05:49 +08:00
|
|
|
c += pg_mblen(c);
|
|
|
|
}
|
|
|
|
|
2004-06-23 19:06:11 +08:00
|
|
|
|
2004-08-29 13:07:03 +08:00
|
|
|
while (ptr)
|
|
|
|
{
|
|
|
|
switch (ptr->type)
|
|
|
|
{
|
2004-06-23 19:06:11 +08:00
|
|
|
case RSF_ONEOF:
|
2006-10-04 08:30:14 +08:00
|
|
|
if (mb_strchr((char *) ptr->data, c) != true)
|
2005-12-21 21:05:49 +08:00
|
|
|
return false;
|
2004-06-23 19:06:11 +08:00
|
|
|
break;
|
|
|
|
case RSF_NONEOF:
|
2006-10-04 08:30:14 +08:00
|
|
|
if (mb_strchr((char *) ptr->data, c) == true)
|
2005-12-21 21:05:49 +08:00
|
|
|
return false;
|
2004-06-23 19:06:11 +08:00
|
|
|
break;
|
|
|
|
default:
|
2004-08-29 13:07:03 +08:00
|
|
|
ts_error(ERROR, "RS_execute: Unknown type node: %d\n", ptr->type);
|
2004-06-23 19:06:11 +08:00
|
|
|
}
|
2004-08-29 13:07:03 +08:00
|
|
|
ptr = ptr->next;
|
2006-10-04 08:30:14 +08:00
|
|
|
c += pg_mblen(c);
|
2004-06-23 19:06:11 +08:00
|
|
|
}
|
|
|
|
|
2005-12-21 21:05:49 +08:00
|
|
|
return true;
|
2004-06-23 19:06:11 +08:00
|
|
|
}
|