Snowball multibyte. It's a pity, but snowball sources is very diferent for multibyte and
singlebyte encodings, so we should have snowball for every encodings. I hope that finalize multibyte support work in tsearch2, but testing is needed...
This commit is contained in:
parent
75c4747156
commit
5e2707c45f
@ -1,4 +1,4 @@
|
|||||||
# $PostgreSQL: pgsql/contrib/tsearch2/Makefile,v 1.12 2005/11/21 12:27:57 teodor Exp $
|
# $PostgreSQL: pgsql/contrib/tsearch2/Makefile,v 1.13 2006/01/27 16:32:31 teodor Exp $
|
||||||
|
|
||||||
MODULE_big = tsearch2
|
MODULE_big = tsearch2
|
||||||
OBJS = dict_ex.o dict.o snmap.o stopword.o common.o prs_dcfg.o \
|
OBJS = dict_ex.o dict.o snmap.o stopword.o common.o prs_dcfg.o \
|
||||||
@ -16,7 +16,7 @@ OBJS += $(SUBDIROBJS)
|
|||||||
|
|
||||||
PG_CPPFLAGS = -I$(srcdir)/snowball -I$(srcdir)/ispell -I$(srcdir)/wordparser
|
PG_CPPFLAGS = -I$(srcdir)/snowball -I$(srcdir)/ispell -I$(srcdir)/wordparser
|
||||||
|
|
||||||
DATA = stopword/english.stop stopword/russian.stop
|
DATA = stopword/english.stop stopword/russian.stop stopword/russian.stop.utf8
|
||||||
DATA_built = tsearch2.sql untsearch2.sql
|
DATA_built = tsearch2.sql untsearch2.sql
|
||||||
DOCS = README.tsearch2
|
DOCS = README.tsearch2
|
||||||
REGRESS = tsearch2
|
REGRESS = tsearch2
|
||||||
|
@ -10,6 +10,7 @@
|
|||||||
#include "snowball/header.h"
|
#include "snowball/header.h"
|
||||||
#include "snowball/english_stem.h"
|
#include "snowball/english_stem.h"
|
||||||
#include "snowball/russian_stem.h"
|
#include "snowball/russian_stem.h"
|
||||||
|
#include "snowball/russian_stem_UTF8.h"
|
||||||
#include "ts_locale.h"
|
#include "ts_locale.h"
|
||||||
|
|
||||||
typedef struct
|
typedef struct
|
||||||
@ -23,8 +24,11 @@ typedef struct
|
|||||||
PG_FUNCTION_INFO_V1(snb_en_init);
|
PG_FUNCTION_INFO_V1(snb_en_init);
|
||||||
Datum snb_en_init(PG_FUNCTION_ARGS);
|
Datum snb_en_init(PG_FUNCTION_ARGS);
|
||||||
|
|
||||||
PG_FUNCTION_INFO_V1(snb_ru_init);
|
PG_FUNCTION_INFO_V1(snb_ru_init_koi8);
|
||||||
Datum snb_ru_init(PG_FUNCTION_ARGS);
|
Datum snb_ru_init_koi8(PG_FUNCTION_ARGS);
|
||||||
|
|
||||||
|
PG_FUNCTION_INFO_V1(snb_ru_init_utf8);
|
||||||
|
Datum snb_ru_init_utf8(PG_FUNCTION_ARGS);
|
||||||
|
|
||||||
PG_FUNCTION_INFO_V1(snb_lexize);
|
PG_FUNCTION_INFO_V1(snb_lexize);
|
||||||
Datum snb_lexize(PG_FUNCTION_ARGS);
|
Datum snb_lexize(PG_FUNCTION_ARGS);
|
||||||
@ -64,7 +68,7 @@ snb_en_init(PG_FUNCTION_ARGS)
|
|||||||
}
|
}
|
||||||
|
|
||||||
Datum
|
Datum
|
||||||
snb_ru_init(PG_FUNCTION_ARGS)
|
snb_ru_init_koi8(PG_FUNCTION_ARGS)
|
||||||
{
|
{
|
||||||
DictSnowball *d = (DictSnowball *) malloc(sizeof(DictSnowball));
|
DictSnowball *d = (DictSnowball *) malloc(sizeof(DictSnowball));
|
||||||
|
|
||||||
@ -97,6 +101,40 @@ snb_ru_init(PG_FUNCTION_ARGS)
|
|||||||
PG_RETURN_POINTER(d);
|
PG_RETURN_POINTER(d);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Datum
|
||||||
|
snb_ru_init_utf8(PG_FUNCTION_ARGS)
|
||||||
|
{
|
||||||
|
DictSnowball *d = (DictSnowball *) malloc(sizeof(DictSnowball));
|
||||||
|
|
||||||
|
if (!d)
|
||||||
|
ereport(ERROR,
|
||||||
|
(errcode(ERRCODE_OUT_OF_MEMORY),
|
||||||
|
errmsg("out of memory")));
|
||||||
|
memset(d, 0, sizeof(DictSnowball));
|
||||||
|
d->stoplist.wordop = lowerstr;
|
||||||
|
|
||||||
|
if (!PG_ARGISNULL(0) && PG_GETARG_POINTER(0) != NULL)
|
||||||
|
{
|
||||||
|
text *in = PG_GETARG_TEXT_P(0);
|
||||||
|
|
||||||
|
readstoplist(in, &(d->stoplist));
|
||||||
|
sortstoplist(&(d->stoplist));
|
||||||
|
PG_FREE_IF_COPY(in, 0);
|
||||||
|
}
|
||||||
|
|
||||||
|
d->z = russian_UTF_8_create_env();
|
||||||
|
if (!d->z)
|
||||||
|
{
|
||||||
|
freestoplist(&(d->stoplist));
|
||||||
|
ereport(ERROR,
|
||||||
|
(errcode(ERRCODE_OUT_OF_MEMORY),
|
||||||
|
errmsg("out of memory")));
|
||||||
|
}
|
||||||
|
d->stem = russian_UTF_8_stem;
|
||||||
|
|
||||||
|
PG_RETURN_POINTER(d);
|
||||||
|
}
|
||||||
|
|
||||||
Datum
|
Datum
|
||||||
snb_lexize(PG_FUNCTION_ARGS)
|
snb_lexize(PG_FUNCTION_ARGS)
|
||||||
{
|
{
|
||||||
|
@ -4,21 +4,21 @@
|
|||||||
--
|
--
|
||||||
\set ECHO none
|
\set ECHO none
|
||||||
psql:tsearch2.sql:13: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_dict_pkey" for table "pg_ts_dict"
|
psql:tsearch2.sql:13: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_dict_pkey" for table "pg_ts_dict"
|
||||||
psql:tsearch2.sql:145: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_parser_pkey" for table "pg_ts_parser"
|
psql:tsearch2.sql:158: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_parser_pkey" for table "pg_ts_parser"
|
||||||
psql:tsearch2.sql:244: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_cfg_pkey" for table "pg_ts_cfg"
|
psql:tsearch2.sql:257: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_cfg_pkey" for table "pg_ts_cfg"
|
||||||
psql:tsearch2.sql:251: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_cfgmap_pkey" for table "pg_ts_cfgmap"
|
psql:tsearch2.sql:264: NOTICE: CREATE TABLE / PRIMARY KEY will create implicit index "pg_ts_cfgmap_pkey" for table "pg_ts_cfgmap"
|
||||||
psql:tsearch2.sql:337: NOTICE: type "tsvector" is not yet defined
|
psql:tsearch2.sql:370: NOTICE: type "tsvector" is not yet defined
|
||||||
DETAIL: Creating a shell type definition.
|
DETAIL: Creating a shell type definition.
|
||||||
psql:tsearch2.sql:342: NOTICE: argument type tsvector is only a shell
|
psql:tsearch2.sql:375: NOTICE: argument type tsvector is only a shell
|
||||||
psql:tsearch2.sql:396: NOTICE: type "tsquery" is not yet defined
|
psql:tsearch2.sql:429: NOTICE: type "tsquery" is not yet defined
|
||||||
DETAIL: Creating a shell type definition.
|
DETAIL: Creating a shell type definition.
|
||||||
psql:tsearch2.sql:401: NOTICE: argument type tsquery is only a shell
|
psql:tsearch2.sql:434: NOTICE: argument type tsquery is only a shell
|
||||||
psql:tsearch2.sql:559: NOTICE: type "gtsvector" is not yet defined
|
psql:tsearch2.sql:592: NOTICE: type "gtsvector" is not yet defined
|
||||||
DETAIL: Creating a shell type definition.
|
DETAIL: Creating a shell type definition.
|
||||||
psql:tsearch2.sql:564: NOTICE: argument type gtsvector is only a shell
|
psql:tsearch2.sql:597: NOTICE: argument type gtsvector is only a shell
|
||||||
psql:tsearch2.sql:1054: NOTICE: type "gtsq" is not yet defined
|
psql:tsearch2.sql:1087: NOTICE: type "gtsq" is not yet defined
|
||||||
DETAIL: Creating a shell type definition.
|
DETAIL: Creating a shell type definition.
|
||||||
psql:tsearch2.sql:1059: NOTICE: argument type gtsq is only a shell
|
psql:tsearch2.sql:1092: NOTICE: argument type gtsq is only a shell
|
||||||
--tsvector
|
--tsvector
|
||||||
SELECT '1'::tsvector;
|
SELECT '1'::tsvector;
|
||||||
tsvector
|
tsvector
|
||||||
|
@ -1,6 +1,6 @@
|
|||||||
# $PostgreSQL: pgsql/contrib/tsearch2/snowball/Makefile,v 1.8 2005/10/18 01:30:48 tgl Exp $
|
# $PostgreSQL: pgsql/contrib/tsearch2/snowball/Makefile,v 1.9 2006/01/27 16:32:31 teodor Exp $
|
||||||
|
|
||||||
SUBOBJS = english_stem.o api.o russian_stem.o utilities.o
|
SUBOBJS = english_stem.o api.o russian_stem.o russian_stem_UTF8.o utilities.o
|
||||||
|
|
||||||
EXTRA_CLEAN = SUBSYS.o $(SUBOBJS)
|
EXTRA_CLEAN = SUBSYS.o $(SUBOBJS)
|
||||||
|
|
||||||
|
709
contrib/tsearch2/snowball/russian_stem_UTF8.c
Normal file
709
contrib/tsearch2/snowball/russian_stem_UTF8.c
Normal file
@ -0,0 +1,709 @@
|
|||||||
|
|
||||||
|
/* This file was generated automatically by the Snowball to ANSI C compiler */
|
||||||
|
|
||||||
|
#include "header.h"
|
||||||
|
|
||||||
|
extern int russian_UTF_8_stem(struct SN_env * z);
|
||||||
|
static int r_tidy_up(struct SN_env * z);
|
||||||
|
static int r_derivational(struct SN_env * z);
|
||||||
|
static int r_noun(struct SN_env * z);
|
||||||
|
static int r_verb(struct SN_env * z);
|
||||||
|
static int r_reflexive(struct SN_env * z);
|
||||||
|
static int r_adjectival(struct SN_env * z);
|
||||||
|
static int r_adjective(struct SN_env * z);
|
||||||
|
static int r_perfective_gerund(struct SN_env * z);
|
||||||
|
static int r_R2(struct SN_env * z);
|
||||||
|
static int r_mark_regions(struct SN_env * z);
|
||||||
|
|
||||||
|
extern struct SN_env * russian_UTF_8_create_env(void);
|
||||||
|
extern void russian_UTF_8_close_env(struct SN_env * z);
|
||||||
|
|
||||||
|
static symbol s_0_0[10] = { 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8, 0xD1, 0x81, 0xD1, 0x8C };
|
||||||
|
static symbol s_0_1[12] = { 0xD1, 0x8B, 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8, 0xD1, 0x81, 0xD1, 0x8C };
|
||||||
|
static symbol s_0_2[12] = { 0xD0, 0xB8, 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8, 0xD1, 0x81, 0xD1, 0x8C };
|
||||||
|
static symbol s_0_3[2] = { 0xD0, 0xB2 };
|
||||||
|
static symbol s_0_4[4] = { 0xD1, 0x8B, 0xD0, 0xB2 };
|
||||||
|
static symbol s_0_5[4] = { 0xD0, 0xB8, 0xD0, 0xB2 };
|
||||||
|
static symbol s_0_6[6] = { 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8 };
|
||||||
|
static symbol s_0_7[8] = { 0xD1, 0x8B, 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8 };
|
||||||
|
static symbol s_0_8[8] = { 0xD0, 0xB8, 0xD0, 0xB2, 0xD1, 0x88, 0xD0, 0xB8 };
|
||||||
|
|
||||||
|
static struct among a_0[9] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 10, s_0_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 12, s_0_1, 0, 2, 0},
|
||||||
|
/* 2 */ { 12, s_0_2, 0, 2, 0},
|
||||||
|
/* 3 */ { 2, s_0_3, -1, 1, 0},
|
||||||
|
/* 4 */ { 4, s_0_4, 3, 2, 0},
|
||||||
|
/* 5 */ { 4, s_0_5, 3, 2, 0},
|
||||||
|
/* 6 */ { 6, s_0_6, -1, 1, 0},
|
||||||
|
/* 7 */ { 8, s_0_7, 6, 2, 0},
|
||||||
|
/* 8 */ { 8, s_0_8, 6, 2, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_1_0[6] = { 0xD0, 0xB5, 0xD0, 0xBC, 0xD1, 0x83 };
|
||||||
|
static symbol s_1_1[6] = { 0xD0, 0xBE, 0xD0, 0xBC, 0xD1, 0x83 };
|
||||||
|
static symbol s_1_2[4] = { 0xD1, 0x8B, 0xD1, 0x85 };
|
||||||
|
static symbol s_1_3[4] = { 0xD0, 0xB8, 0xD1, 0x85 };
|
||||||
|
static symbol s_1_4[4] = { 0xD1, 0x83, 0xD1, 0x8E };
|
||||||
|
static symbol s_1_5[4] = { 0xD1, 0x8E, 0xD1, 0x8E };
|
||||||
|
static symbol s_1_6[4] = { 0xD0, 0xB5, 0xD1, 0x8E };
|
||||||
|
static symbol s_1_7[4] = { 0xD0, 0xBE, 0xD1, 0x8E };
|
||||||
|
static symbol s_1_8[4] = { 0xD1, 0x8F, 0xD1, 0x8F };
|
||||||
|
static symbol s_1_9[4] = { 0xD0, 0xB0, 0xD1, 0x8F };
|
||||||
|
static symbol s_1_10[4] = { 0xD1, 0x8B, 0xD0, 0xB5 };
|
||||||
|
static symbol s_1_11[4] = { 0xD0, 0xB5, 0xD0, 0xB5 };
|
||||||
|
static symbol s_1_12[4] = { 0xD0, 0xB8, 0xD0, 0xB5 };
|
||||||
|
static symbol s_1_13[4] = { 0xD0, 0xBE, 0xD0, 0xB5 };
|
||||||
|
static symbol s_1_14[6] = { 0xD1, 0x8B, 0xD0, 0xBC, 0xD0, 0xB8 };
|
||||||
|
static symbol s_1_15[6] = { 0xD0, 0xB8, 0xD0, 0xBC, 0xD0, 0xB8 };
|
||||||
|
static symbol s_1_16[4] = { 0xD1, 0x8B, 0xD0, 0xB9 };
|
||||||
|
static symbol s_1_17[4] = { 0xD0, 0xB5, 0xD0, 0xB9 };
|
||||||
|
static symbol s_1_18[4] = { 0xD0, 0xB8, 0xD0, 0xB9 };
|
||||||
|
static symbol s_1_19[4] = { 0xD0, 0xBE, 0xD0, 0xB9 };
|
||||||
|
static symbol s_1_20[4] = { 0xD1, 0x8B, 0xD0, 0xBC };
|
||||||
|
static symbol s_1_21[4] = { 0xD0, 0xB5, 0xD0, 0xBC };
|
||||||
|
static symbol s_1_22[4] = { 0xD0, 0xB8, 0xD0, 0xBC };
|
||||||
|
static symbol s_1_23[4] = { 0xD0, 0xBE, 0xD0, 0xBC };
|
||||||
|
static symbol s_1_24[6] = { 0xD0, 0xB5, 0xD0, 0xB3, 0xD0, 0xBE };
|
||||||
|
static symbol s_1_25[6] = { 0xD0, 0xBE, 0xD0, 0xB3, 0xD0, 0xBE };
|
||||||
|
|
||||||
|
static struct among a_1[26] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 6, s_1_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 6, s_1_1, -1, 1, 0},
|
||||||
|
/* 2 */ { 4, s_1_2, -1, 1, 0},
|
||||||
|
/* 3 */ { 4, s_1_3, -1, 1, 0},
|
||||||
|
/* 4 */ { 4, s_1_4, -1, 1, 0},
|
||||||
|
/* 5 */ { 4, s_1_5, -1, 1, 0},
|
||||||
|
/* 6 */ { 4, s_1_6, -1, 1, 0},
|
||||||
|
/* 7 */ { 4, s_1_7, -1, 1, 0},
|
||||||
|
/* 8 */ { 4, s_1_8, -1, 1, 0},
|
||||||
|
/* 9 */ { 4, s_1_9, -1, 1, 0},
|
||||||
|
/* 10 */ { 4, s_1_10, -1, 1, 0},
|
||||||
|
/* 11 */ { 4, s_1_11, -1, 1, 0},
|
||||||
|
/* 12 */ { 4, s_1_12, -1, 1, 0},
|
||||||
|
/* 13 */ { 4, s_1_13, -1, 1, 0},
|
||||||
|
/* 14 */ { 6, s_1_14, -1, 1, 0},
|
||||||
|
/* 15 */ { 6, s_1_15, -1, 1, 0},
|
||||||
|
/* 16 */ { 4, s_1_16, -1, 1, 0},
|
||||||
|
/* 17 */ { 4, s_1_17, -1, 1, 0},
|
||||||
|
/* 18 */ { 4, s_1_18, -1, 1, 0},
|
||||||
|
/* 19 */ { 4, s_1_19, -1, 1, 0},
|
||||||
|
/* 20 */ { 4, s_1_20, -1, 1, 0},
|
||||||
|
/* 21 */ { 4, s_1_21, -1, 1, 0},
|
||||||
|
/* 22 */ { 4, s_1_22, -1, 1, 0},
|
||||||
|
/* 23 */ { 4, s_1_23, -1, 1, 0},
|
||||||
|
/* 24 */ { 6, s_1_24, -1, 1, 0},
|
||||||
|
/* 25 */ { 6, s_1_25, -1, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_2_0[4] = { 0xD0, 0xB2, 0xD1, 0x88 };
|
||||||
|
static symbol s_2_1[6] = { 0xD1, 0x8B, 0xD0, 0xB2, 0xD1, 0x88 };
|
||||||
|
static symbol s_2_2[6] = { 0xD0, 0xB8, 0xD0, 0xB2, 0xD1, 0x88 };
|
||||||
|
static symbol s_2_3[2] = { 0xD1, 0x89 };
|
||||||
|
static symbol s_2_4[4] = { 0xD1, 0x8E, 0xD1, 0x89 };
|
||||||
|
static symbol s_2_5[6] = { 0xD1, 0x83, 0xD1, 0x8E, 0xD1, 0x89 };
|
||||||
|
static symbol s_2_6[4] = { 0xD0, 0xB5, 0xD0, 0xBC };
|
||||||
|
static symbol s_2_7[4] = { 0xD0, 0xBD, 0xD0, 0xBD };
|
||||||
|
|
||||||
|
static struct among a_2[8] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 4, s_2_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 6, s_2_1, 0, 2, 0},
|
||||||
|
/* 2 */ { 6, s_2_2, 0, 2, 0},
|
||||||
|
/* 3 */ { 2, s_2_3, -1, 1, 0},
|
||||||
|
/* 4 */ { 4, s_2_4, 3, 1, 0},
|
||||||
|
/* 5 */ { 6, s_2_5, 4, 2, 0},
|
||||||
|
/* 6 */ { 4, s_2_6, -1, 1, 0},
|
||||||
|
/* 7 */ { 4, s_2_7, -1, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_3_0[4] = { 0xD1, 0x81, 0xD1, 0x8C };
|
||||||
|
static symbol s_3_1[4] = { 0xD1, 0x81, 0xD1, 0x8F };
|
||||||
|
|
||||||
|
static struct among a_3[2] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 4, s_3_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 4, s_3_1, -1, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_4_0[4] = { 0xD1, 0x8B, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_1[4] = { 0xD1, 0x8E, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_2[6] = { 0xD1, 0x83, 0xD1, 0x8E, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_3[4] = { 0xD1, 0x8F, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_4[4] = { 0xD0, 0xB5, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_5[6] = { 0xD1, 0x83, 0xD0, 0xB5, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_6[4] = { 0xD0, 0xB8, 0xD1, 0x82 };
|
||||||
|
static symbol s_4_7[4] = { 0xD0, 0xBD, 0xD1, 0x8B };
|
||||||
|
static symbol s_4_8[6] = { 0xD0, 0xB5, 0xD0, 0xBD, 0xD1, 0x8B };
|
||||||
|
static symbol s_4_9[4] = { 0xD1, 0x82, 0xD1, 0x8C };
|
||||||
|
static symbol s_4_10[6] = { 0xD1, 0x8B, 0xD1, 0x82, 0xD1, 0x8C };
|
||||||
|
static symbol s_4_11[6] = { 0xD0, 0xB8, 0xD1, 0x82, 0xD1, 0x8C };
|
||||||
|
static symbol s_4_12[6] = { 0xD0, 0xB5, 0xD1, 0x88, 0xD1, 0x8C };
|
||||||
|
static symbol s_4_13[6] = { 0xD0, 0xB8, 0xD1, 0x88, 0xD1, 0x8C };
|
||||||
|
static symbol s_4_14[2] = { 0xD1, 0x8E };
|
||||||
|
static symbol s_4_15[4] = { 0xD1, 0x83, 0xD1, 0x8E };
|
||||||
|
static symbol s_4_16[4] = { 0xD0, 0xBB, 0xD0, 0xB0 };
|
||||||
|
static symbol s_4_17[6] = { 0xD1, 0x8B, 0xD0, 0xBB, 0xD0, 0xB0 };
|
||||||
|
static symbol s_4_18[6] = { 0xD0, 0xB8, 0xD0, 0xBB, 0xD0, 0xB0 };
|
||||||
|
static symbol s_4_19[4] = { 0xD0, 0xBD, 0xD0, 0xB0 };
|
||||||
|
static symbol s_4_20[6] = { 0xD0, 0xB5, 0xD0, 0xBD, 0xD0, 0xB0 };
|
||||||
|
static symbol s_4_21[6] = { 0xD0, 0xB5, 0xD1, 0x82, 0xD0, 0xB5 };
|
||||||
|
static symbol s_4_22[6] = { 0xD0, 0xB8, 0xD1, 0x82, 0xD0, 0xB5 };
|
||||||
|
static symbol s_4_23[6] = { 0xD0, 0xB9, 0xD1, 0x82, 0xD0, 0xB5 };
|
||||||
|
static symbol s_4_24[8] = { 0xD1, 0x83, 0xD0, 0xB9, 0xD1, 0x82, 0xD0, 0xB5 };
|
||||||
|
static symbol s_4_25[8] = { 0xD0, 0xB5, 0xD0, 0xB9, 0xD1, 0x82, 0xD0, 0xB5 };
|
||||||
|
static symbol s_4_26[4] = { 0xD0, 0xBB, 0xD0, 0xB8 };
|
||||||
|
static symbol s_4_27[6] = { 0xD1, 0x8B, 0xD0, 0xBB, 0xD0, 0xB8 };
|
||||||
|
static symbol s_4_28[6] = { 0xD0, 0xB8, 0xD0, 0xBB, 0xD0, 0xB8 };
|
||||||
|
static symbol s_4_29[2] = { 0xD0, 0xB9 };
|
||||||
|
static symbol s_4_30[4] = { 0xD1, 0x83, 0xD0, 0xB9 };
|
||||||
|
static symbol s_4_31[4] = { 0xD0, 0xB5, 0xD0, 0xB9 };
|
||||||
|
static symbol s_4_32[2] = { 0xD0, 0xBB };
|
||||||
|
static symbol s_4_33[4] = { 0xD1, 0x8B, 0xD0, 0xBB };
|
||||||
|
static symbol s_4_34[4] = { 0xD0, 0xB8, 0xD0, 0xBB };
|
||||||
|
static symbol s_4_35[4] = { 0xD1, 0x8B, 0xD0, 0xBC };
|
||||||
|
static symbol s_4_36[4] = { 0xD0, 0xB5, 0xD0, 0xBC };
|
||||||
|
static symbol s_4_37[4] = { 0xD0, 0xB8, 0xD0, 0xBC };
|
||||||
|
static symbol s_4_38[2] = { 0xD0, 0xBD };
|
||||||
|
static symbol s_4_39[4] = { 0xD0, 0xB5, 0xD0, 0xBD };
|
||||||
|
static symbol s_4_40[4] = { 0xD0, 0xBB, 0xD0, 0xBE };
|
||||||
|
static symbol s_4_41[6] = { 0xD1, 0x8B, 0xD0, 0xBB, 0xD0, 0xBE };
|
||||||
|
static symbol s_4_42[6] = { 0xD0, 0xB8, 0xD0, 0xBB, 0xD0, 0xBE };
|
||||||
|
static symbol s_4_43[4] = { 0xD0, 0xBD, 0xD0, 0xBE };
|
||||||
|
static symbol s_4_44[6] = { 0xD0, 0xB5, 0xD0, 0xBD, 0xD0, 0xBE };
|
||||||
|
static symbol s_4_45[6] = { 0xD0, 0xBD, 0xD0, 0xBD, 0xD0, 0xBE };
|
||||||
|
|
||||||
|
static struct among a_4[46] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 4, s_4_0, -1, 2, 0},
|
||||||
|
/* 1 */ { 4, s_4_1, -1, 1, 0},
|
||||||
|
/* 2 */ { 6, s_4_2, 1, 2, 0},
|
||||||
|
/* 3 */ { 4, s_4_3, -1, 2, 0},
|
||||||
|
/* 4 */ { 4, s_4_4, -1, 1, 0},
|
||||||
|
/* 5 */ { 6, s_4_5, 4, 2, 0},
|
||||||
|
/* 6 */ { 4, s_4_6, -1, 2, 0},
|
||||||
|
/* 7 */ { 4, s_4_7, -1, 1, 0},
|
||||||
|
/* 8 */ { 6, s_4_8, 7, 2, 0},
|
||||||
|
/* 9 */ { 4, s_4_9, -1, 1, 0},
|
||||||
|
/* 10 */ { 6, s_4_10, 9, 2, 0},
|
||||||
|
/* 11 */ { 6, s_4_11, 9, 2, 0},
|
||||||
|
/* 12 */ { 6, s_4_12, -1, 1, 0},
|
||||||
|
/* 13 */ { 6, s_4_13, -1, 2, 0},
|
||||||
|
/* 14 */ { 2, s_4_14, -1, 2, 0},
|
||||||
|
/* 15 */ { 4, s_4_15, 14, 2, 0},
|
||||||
|
/* 16 */ { 4, s_4_16, -1, 1, 0},
|
||||||
|
/* 17 */ { 6, s_4_17, 16, 2, 0},
|
||||||
|
/* 18 */ { 6, s_4_18, 16, 2, 0},
|
||||||
|
/* 19 */ { 4, s_4_19, -1, 1, 0},
|
||||||
|
/* 20 */ { 6, s_4_20, 19, 2, 0},
|
||||||
|
/* 21 */ { 6, s_4_21, -1, 1, 0},
|
||||||
|
/* 22 */ { 6, s_4_22, -1, 2, 0},
|
||||||
|
/* 23 */ { 6, s_4_23, -1, 1, 0},
|
||||||
|
/* 24 */ { 8, s_4_24, 23, 2, 0},
|
||||||
|
/* 25 */ { 8, s_4_25, 23, 2, 0},
|
||||||
|
/* 26 */ { 4, s_4_26, -1, 1, 0},
|
||||||
|
/* 27 */ { 6, s_4_27, 26, 2, 0},
|
||||||
|
/* 28 */ { 6, s_4_28, 26, 2, 0},
|
||||||
|
/* 29 */ { 2, s_4_29, -1, 1, 0},
|
||||||
|
/* 30 */ { 4, s_4_30, 29, 2, 0},
|
||||||
|
/* 31 */ { 4, s_4_31, 29, 2, 0},
|
||||||
|
/* 32 */ { 2, s_4_32, -1, 1, 0},
|
||||||
|
/* 33 */ { 4, s_4_33, 32, 2, 0},
|
||||||
|
/* 34 */ { 4, s_4_34, 32, 2, 0},
|
||||||
|
/* 35 */ { 4, s_4_35, -1, 2, 0},
|
||||||
|
/* 36 */ { 4, s_4_36, -1, 1, 0},
|
||||||
|
/* 37 */ { 4, s_4_37, -1, 2, 0},
|
||||||
|
/* 38 */ { 2, s_4_38, -1, 1, 0},
|
||||||
|
/* 39 */ { 4, s_4_39, 38, 2, 0},
|
||||||
|
/* 40 */ { 4, s_4_40, -1, 1, 0},
|
||||||
|
/* 41 */ { 6, s_4_41, 40, 2, 0},
|
||||||
|
/* 42 */ { 6, s_4_42, 40, 2, 0},
|
||||||
|
/* 43 */ { 4, s_4_43, -1, 1, 0},
|
||||||
|
/* 44 */ { 6, s_4_44, 43, 2, 0},
|
||||||
|
/* 45 */ { 6, s_4_45, 43, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_5_0[2] = { 0xD1, 0x83 };
|
||||||
|
static symbol s_5_1[4] = { 0xD1, 0x8F, 0xD1, 0x85 };
|
||||||
|
static symbol s_5_2[6] = { 0xD0, 0xB8, 0xD1, 0x8F, 0xD1, 0x85 };
|
||||||
|
static symbol s_5_3[4] = { 0xD0, 0xB0, 0xD1, 0x85 };
|
||||||
|
static symbol s_5_4[2] = { 0xD1, 0x8B };
|
||||||
|
static symbol s_5_5[2] = { 0xD1, 0x8C };
|
||||||
|
static symbol s_5_6[2] = { 0xD1, 0x8E };
|
||||||
|
static symbol s_5_7[4] = { 0xD1, 0x8C, 0xD1, 0x8E };
|
||||||
|
static symbol s_5_8[4] = { 0xD0, 0xB8, 0xD1, 0x8E };
|
||||||
|
static symbol s_5_9[2] = { 0xD1, 0x8F };
|
||||||
|
static symbol s_5_10[4] = { 0xD1, 0x8C, 0xD1, 0x8F };
|
||||||
|
static symbol s_5_11[4] = { 0xD0, 0xB8, 0xD1, 0x8F };
|
||||||
|
static symbol s_5_12[2] = { 0xD0, 0xB0 };
|
||||||
|
static symbol s_5_13[4] = { 0xD0, 0xB5, 0xD0, 0xB2 };
|
||||||
|
static symbol s_5_14[4] = { 0xD0, 0xBE, 0xD0, 0xB2 };
|
||||||
|
static symbol s_5_15[2] = { 0xD0, 0xB5 };
|
||||||
|
static symbol s_5_16[4] = { 0xD1, 0x8C, 0xD0, 0xB5 };
|
||||||
|
static symbol s_5_17[4] = { 0xD0, 0xB8, 0xD0, 0xB5 };
|
||||||
|
static symbol s_5_18[2] = { 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_19[4] = { 0xD0, 0xB5, 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_20[4] = { 0xD0, 0xB8, 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_21[6] = { 0xD1, 0x8F, 0xD0, 0xBC, 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_22[8] = { 0xD0, 0xB8, 0xD1, 0x8F, 0xD0, 0xBC, 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_23[6] = { 0xD0, 0xB0, 0xD0, 0xBC, 0xD0, 0xB8 };
|
||||||
|
static symbol s_5_24[2] = { 0xD0, 0xB9 };
|
||||||
|
static symbol s_5_25[4] = { 0xD0, 0xB5, 0xD0, 0xB9 };
|
||||||
|
static symbol s_5_26[6] = { 0xD0, 0xB8, 0xD0, 0xB5, 0xD0, 0xB9 };
|
||||||
|
static symbol s_5_27[4] = { 0xD0, 0xB8, 0xD0, 0xB9 };
|
||||||
|
static symbol s_5_28[4] = { 0xD0, 0xBE, 0xD0, 0xB9 };
|
||||||
|
static symbol s_5_29[4] = { 0xD1, 0x8F, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_30[6] = { 0xD0, 0xB8, 0xD1, 0x8F, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_31[4] = { 0xD0, 0xB0, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_32[4] = { 0xD0, 0xB5, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_33[6] = { 0xD0, 0xB8, 0xD0, 0xB5, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_34[4] = { 0xD0, 0xBE, 0xD0, 0xBC };
|
||||||
|
static symbol s_5_35[2] = { 0xD0, 0xBE };
|
||||||
|
|
||||||
|
static struct among a_5[36] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 2, s_5_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 4, s_5_1, -1, 1, 0},
|
||||||
|
/* 2 */ { 6, s_5_2, 1, 1, 0},
|
||||||
|
/* 3 */ { 4, s_5_3, -1, 1, 0},
|
||||||
|
/* 4 */ { 2, s_5_4, -1, 1, 0},
|
||||||
|
/* 5 */ { 2, s_5_5, -1, 1, 0},
|
||||||
|
/* 6 */ { 2, s_5_6, -1, 1, 0},
|
||||||
|
/* 7 */ { 4, s_5_7, 6, 1, 0},
|
||||||
|
/* 8 */ { 4, s_5_8, 6, 1, 0},
|
||||||
|
/* 9 */ { 2, s_5_9, -1, 1, 0},
|
||||||
|
/* 10 */ { 4, s_5_10, 9, 1, 0},
|
||||||
|
/* 11 */ { 4, s_5_11, 9, 1, 0},
|
||||||
|
/* 12 */ { 2, s_5_12, -1, 1, 0},
|
||||||
|
/* 13 */ { 4, s_5_13, -1, 1, 0},
|
||||||
|
/* 14 */ { 4, s_5_14, -1, 1, 0},
|
||||||
|
/* 15 */ { 2, s_5_15, -1, 1, 0},
|
||||||
|
/* 16 */ { 4, s_5_16, 15, 1, 0},
|
||||||
|
/* 17 */ { 4, s_5_17, 15, 1, 0},
|
||||||
|
/* 18 */ { 2, s_5_18, -1, 1, 0},
|
||||||
|
/* 19 */ { 4, s_5_19, 18, 1, 0},
|
||||||
|
/* 20 */ { 4, s_5_20, 18, 1, 0},
|
||||||
|
/* 21 */ { 6, s_5_21, 18, 1, 0},
|
||||||
|
/* 22 */ { 8, s_5_22, 21, 1, 0},
|
||||||
|
/* 23 */ { 6, s_5_23, 18, 1, 0},
|
||||||
|
/* 24 */ { 2, s_5_24, -1, 1, 0},
|
||||||
|
/* 25 */ { 4, s_5_25, 24, 1, 0},
|
||||||
|
/* 26 */ { 6, s_5_26, 25, 1, 0},
|
||||||
|
/* 27 */ { 4, s_5_27, 24, 1, 0},
|
||||||
|
/* 28 */ { 4, s_5_28, 24, 1, 0},
|
||||||
|
/* 29 */ { 4, s_5_29, -1, 1, 0},
|
||||||
|
/* 30 */ { 6, s_5_30, 29, 1, 0},
|
||||||
|
/* 31 */ { 4, s_5_31, -1, 1, 0},
|
||||||
|
/* 32 */ { 4, s_5_32, -1, 1, 0},
|
||||||
|
/* 33 */ { 6, s_5_33, 32, 1, 0},
|
||||||
|
/* 34 */ { 4, s_5_34, -1, 1, 0},
|
||||||
|
/* 35 */ { 2, s_5_35, -1, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_6_0[6] = { 0xD0, 0xBE, 0xD1, 0x81, 0xD1, 0x82 };
|
||||||
|
static symbol s_6_1[8] = { 0xD0, 0xBE, 0xD1, 0x81, 0xD1, 0x82, 0xD1, 0x8C };
|
||||||
|
|
||||||
|
static struct among a_6[2] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 6, s_6_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 8, s_6_1, -1, 1, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static symbol s_7_0[6] = { 0xD0, 0xB5, 0xD0, 0xB9, 0xD1, 0x88 };
|
||||||
|
static symbol s_7_1[2] = { 0xD1, 0x8C };
|
||||||
|
static symbol s_7_2[8] = { 0xD0, 0xB5, 0xD0, 0xB9, 0xD1, 0x88, 0xD0, 0xB5 };
|
||||||
|
static symbol s_7_3[2] = { 0xD0, 0xBD };
|
||||||
|
|
||||||
|
static struct among a_7[4] =
|
||||||
|
{
|
||||||
|
/* 0 */ { 6, s_7_0, -1, 1, 0},
|
||||||
|
/* 1 */ { 2, s_7_1, -1, 3, 0},
|
||||||
|
/* 2 */ { 8, s_7_2, -1, 1, 0},
|
||||||
|
/* 3 */ { 2, s_7_3, -1, 2, 0}
|
||||||
|
};
|
||||||
|
|
||||||
|
static unsigned char g_v[] = { 33, 65, 8, 232 };
|
||||||
|
|
||||||
|
static symbol s_0[] = { 0xD0, 0xB0 };
|
||||||
|
static symbol s_1[] = { 0xD1, 0x8F };
|
||||||
|
static symbol s_2[] = { 0xD0, 0xB0 };
|
||||||
|
static symbol s_3[] = { 0xD1, 0x8F };
|
||||||
|
static symbol s_4[] = { 0xD0, 0xB0 };
|
||||||
|
static symbol s_5[] = { 0xD1, 0x8F };
|
||||||
|
static symbol s_6[] = { 0xD0, 0xBD };
|
||||||
|
static symbol s_7[] = { 0xD0, 0xBD };
|
||||||
|
static symbol s_8[] = { 0xD0, 0xBD };
|
||||||
|
static symbol s_9[] = { 0xD0, 0xB8 };
|
||||||
|
|
||||||
|
static int r_mark_regions(struct SN_env * z) {
|
||||||
|
z->I[0] = z->l;
|
||||||
|
z->I[1] = z->l;
|
||||||
|
{ int c = z->c; /* do, line 61 */
|
||||||
|
while(1) { /* gopast, line 62 */
|
||||||
|
if (!(in_grouping_U(z, g_v, 1072, 1103))) goto lab1;
|
||||||
|
break;
|
||||||
|
lab1:
|
||||||
|
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
||||||
|
if (c < 0) goto lab0;
|
||||||
|
z->c = c; /* gopast, line 62 */
|
||||||
|
}
|
||||||
|
}
|
||||||
|
z->I[0] = z->c; /* setmark pV, line 62 */
|
||||||
|
while(1) { /* gopast, line 62 */
|
||||||
|
if (!(out_grouping_U(z, g_v, 1072, 1103))) goto lab2;
|
||||||
|
break;
|
||||||
|
lab2:
|
||||||
|
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
||||||
|
if (c < 0) goto lab0;
|
||||||
|
z->c = c; /* gopast, line 62 */
|
||||||
|
}
|
||||||
|
}
|
||||||
|
while(1) { /* gopast, line 63 */
|
||||||
|
if (!(in_grouping_U(z, g_v, 1072, 1103))) goto lab3;
|
||||||
|
break;
|
||||||
|
lab3:
|
||||||
|
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
||||||
|
if (c < 0) goto lab0;
|
||||||
|
z->c = c; /* gopast, line 63 */
|
||||||
|
}
|
||||||
|
}
|
||||||
|
while(1) { /* gopast, line 63 */
|
||||||
|
if (!(out_grouping_U(z, g_v, 1072, 1103))) goto lab4;
|
||||||
|
break;
|
||||||
|
lab4:
|
||||||
|
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
||||||
|
if (c < 0) goto lab0;
|
||||||
|
z->c = c; /* gopast, line 63 */
|
||||||
|
}
|
||||||
|
}
|
||||||
|
z->I[1] = z->c; /* setmark p2, line 63 */
|
||||||
|
lab0:
|
||||||
|
z->c = c;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_R2(struct SN_env * z) {
|
||||||
|
if (!(z->I[1] <= z->c)) return 0;
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_perfective_gerund(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 72 */
|
||||||
|
among_var = find_among_b(z, a_0, 9); /* substring, line 72 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 72 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int m = z->l - z->c; (void) m; /* or, line 76 */
|
||||||
|
if (!(eq_s_b(z, 2, s_0))) goto lab1;
|
||||||
|
goto lab0;
|
||||||
|
lab1:
|
||||||
|
z->c = z->l - m;
|
||||||
|
if (!(eq_s_b(z, 2, s_1))) return 0;
|
||||||
|
}
|
||||||
|
lab0:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 76 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 2:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 83 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_adjective(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 88 */
|
||||||
|
among_var = find_among_b(z, a_1, 26); /* substring, line 88 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 88 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 97 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_adjectival(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
{ int ret = r_adjective(z);
|
||||||
|
if (ret == 0) return 0; /* call adjective, line 102 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
{ int m = z->l - z->c; (void) m; /* try, line 109 */
|
||||||
|
z->ket = z->c; /* [, line 110 */
|
||||||
|
among_var = find_among_b(z, a_2, 8); /* substring, line 110 */
|
||||||
|
if (!(among_var)) { z->c = z->l - m; goto lab0; }
|
||||||
|
z->bra = z->c; /* ], line 110 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: { z->c = z->l - m; goto lab0; }
|
||||||
|
case 1:
|
||||||
|
{ int m = z->l - z->c; (void) m; /* or, line 115 */
|
||||||
|
if (!(eq_s_b(z, 2, s_2))) goto lab2;
|
||||||
|
goto lab1;
|
||||||
|
lab2:
|
||||||
|
z->c = z->l - m;
|
||||||
|
if (!(eq_s_b(z, 2, s_3))) { z->c = z->l - m; goto lab0; }
|
||||||
|
}
|
||||||
|
lab1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 115 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 2:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 122 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
lab0:
|
||||||
|
;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_reflexive(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 129 */
|
||||||
|
among_var = find_among_b(z, a_3, 2); /* substring, line 129 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 129 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 132 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_verb(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 137 */
|
||||||
|
among_var = find_among_b(z, a_4, 46); /* substring, line 137 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 137 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int m = z->l - z->c; (void) m; /* or, line 143 */
|
||||||
|
if (!(eq_s_b(z, 2, s_4))) goto lab1;
|
||||||
|
goto lab0;
|
||||||
|
lab1:
|
||||||
|
z->c = z->l - m;
|
||||||
|
if (!(eq_s_b(z, 2, s_5))) return 0;
|
||||||
|
}
|
||||||
|
lab0:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 143 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 2:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 151 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_noun(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 160 */
|
||||||
|
among_var = find_among_b(z, a_5, 36); /* substring, line 160 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 160 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 167 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_derivational(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 176 */
|
||||||
|
among_var = find_among_b(z, a_6, 2); /* substring, line 176 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 176 */
|
||||||
|
{ int ret = r_R2(z);
|
||||||
|
if (ret == 0) return 0; /* call R2, line 176 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 179 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int r_tidy_up(struct SN_env * z) {
|
||||||
|
int among_var;
|
||||||
|
z->ket = z->c; /* [, line 184 */
|
||||||
|
among_var = find_among_b(z, a_7, 4); /* substring, line 184 */
|
||||||
|
if (!(among_var)) return 0;
|
||||||
|
z->bra = z->c; /* ], line 184 */
|
||||||
|
switch(among_var) {
|
||||||
|
case 0: return 0;
|
||||||
|
case 1:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 188 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
z->ket = z->c; /* [, line 189 */
|
||||||
|
if (!(eq_s_b(z, 2, s_6))) return 0;
|
||||||
|
z->bra = z->c; /* ], line 189 */
|
||||||
|
if (!(eq_s_b(z, 2, s_7))) return 0;
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 189 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 2:
|
||||||
|
if (!(eq_s_b(z, 2, s_8))) return 0;
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 192 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
case 3:
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 194 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
extern int russian_UTF_8_stem(struct SN_env * z) {
|
||||||
|
{ int c = z->c; /* do, line 201 */
|
||||||
|
{ int ret = r_mark_regions(z);
|
||||||
|
if (ret == 0) goto lab0; /* call mark_regions, line 201 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
lab0:
|
||||||
|
z->c = c;
|
||||||
|
}
|
||||||
|
z->lb = z->c; z->c = z->l; /* backwards, line 202 */
|
||||||
|
|
||||||
|
{ int m3; /* setlimit, line 202 */
|
||||||
|
int m = z->l - z->c; (void) m;
|
||||||
|
if (z->c < z->I[0]) return 0;
|
||||||
|
z->c = z->I[0]; /* tomark, line 202 */
|
||||||
|
m3 = z->lb; z->lb = z->c;
|
||||||
|
z->c = z->l - m;
|
||||||
|
{ int m = z->l - z->c; (void) m; /* do, line 203 */
|
||||||
|
{ int m = z->l - z->c; (void) m; /* or, line 204 */
|
||||||
|
{ int ret = r_perfective_gerund(z);
|
||||||
|
if (ret == 0) goto lab3; /* call perfective_gerund, line 204 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
goto lab2;
|
||||||
|
lab3:
|
||||||
|
z->c = z->l - m;
|
||||||
|
{ int m = z->l - z->c; (void) m; /* try, line 205 */
|
||||||
|
{ int ret = r_reflexive(z);
|
||||||
|
if (ret == 0) { z->c = z->l - m; goto lab4; } /* call reflexive, line 205 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
lab4:
|
||||||
|
;
|
||||||
|
}
|
||||||
|
{ int m = z->l - z->c; (void) m; /* or, line 206 */
|
||||||
|
{ int ret = r_adjectival(z);
|
||||||
|
if (ret == 0) goto lab6; /* call adjectival, line 206 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
goto lab5;
|
||||||
|
lab6:
|
||||||
|
z->c = z->l - m;
|
||||||
|
{ int ret = r_verb(z);
|
||||||
|
if (ret == 0) goto lab7; /* call verb, line 206 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
goto lab5;
|
||||||
|
lab7:
|
||||||
|
z->c = z->l - m;
|
||||||
|
{ int ret = r_noun(z);
|
||||||
|
if (ret == 0) goto lab1; /* call noun, line 206 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
lab5:
|
||||||
|
;
|
||||||
|
}
|
||||||
|
lab2:
|
||||||
|
lab1:
|
||||||
|
z->c = z->l - m;
|
||||||
|
}
|
||||||
|
{ int m = z->l - z->c; (void) m; /* try, line 209 */
|
||||||
|
z->ket = z->c; /* [, line 209 */
|
||||||
|
if (!(eq_s_b(z, 2, s_9))) { z->c = z->l - m; goto lab8; }
|
||||||
|
z->bra = z->c; /* ], line 209 */
|
||||||
|
{ int ret;
|
||||||
|
ret = slice_del(z); /* delete, line 209 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
lab8:
|
||||||
|
;
|
||||||
|
}
|
||||||
|
{ int m = z->l - z->c; (void) m; /* do, line 212 */
|
||||||
|
{ int ret = r_derivational(z);
|
||||||
|
if (ret == 0) goto lab9; /* call derivational, line 212 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
lab9:
|
||||||
|
z->c = z->l - m;
|
||||||
|
}
|
||||||
|
{ int m = z->l - z->c; (void) m; /* do, line 213 */
|
||||||
|
{ int ret = r_tidy_up(z);
|
||||||
|
if (ret == 0) goto lab10; /* call tidy_up, line 213 */
|
||||||
|
if (ret < 0) return ret;
|
||||||
|
}
|
||||||
|
lab10:
|
||||||
|
z->c = z->l - m;
|
||||||
|
}
|
||||||
|
z->lb = m3;
|
||||||
|
}
|
||||||
|
z->c = z->lb;
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
extern struct SN_env * russian_UTF_8_create_env(void) { return SN_create_env(0, 2, 0); }
|
||||||
|
|
||||||
|
extern void russian_UTF_8_close_env(struct SN_env * z) { SN_close_env(z); }
|
||||||
|
|
16
contrib/tsearch2/snowball/russian_stem_UTF8.h
Normal file
16
contrib/tsearch2/snowball/russian_stem_UTF8.h
Normal file
@ -0,0 +1,16 @@
|
|||||||
|
|
||||||
|
/* This file was generated automatically by the Snowball to ANSI C compiler */
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
extern "C" {
|
||||||
|
#endif
|
||||||
|
|
||||||
|
extern struct SN_env * russian_UTF_8_create_env(void);
|
||||||
|
extern void russian_UTF_8_close_env(struct SN_env * z);
|
||||||
|
|
||||||
|
extern int russian_UTF_8_stem(struct SN_env * z);
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
}
|
||||||
|
#endif
|
||||||
|
|
151
contrib/tsearch2/stopword/russian.stop.utf8
Normal file
151
contrib/tsearch2/stopword/russian.stop.utf8
Normal file
@ -0,0 +1,151 @@
|
|||||||
|
и
|
||||||
|
в
|
||||||
|
во
|
||||||
|
не
|
||||||
|
что
|
||||||
|
он
|
||||||
|
на
|
||||||
|
я
|
||||||
|
с
|
||||||
|
со
|
||||||
|
как
|
||||||
|
а
|
||||||
|
то
|
||||||
|
все
|
||||||
|
она
|
||||||
|
так
|
||||||
|
его
|
||||||
|
но
|
||||||
|
да
|
||||||
|
ты
|
||||||
|
к
|
||||||
|
у
|
||||||
|
же
|
||||||
|
вы
|
||||||
|
за
|
||||||
|
бы
|
||||||
|
по
|
||||||
|
только
|
||||||
|
ее
|
||||||
|
мне
|
||||||
|
было
|
||||||
|
вот
|
||||||
|
от
|
||||||
|
меня
|
||||||
|
еще
|
||||||
|
нет
|
||||||
|
о
|
||||||
|
из
|
||||||
|
ему
|
||||||
|
теперь
|
||||||
|
когда
|
||||||
|
даже
|
||||||
|
ну
|
||||||
|
вдруг
|
||||||
|
ли
|
||||||
|
если
|
||||||
|
уже
|
||||||
|
или
|
||||||
|
ни
|
||||||
|
быть
|
||||||
|
был
|
||||||
|
него
|
||||||
|
до
|
||||||
|
вас
|
||||||
|
нибудь
|
||||||
|
опять
|
||||||
|
уж
|
||||||
|
вам
|
||||||
|
ведь
|
||||||
|
там
|
||||||
|
потом
|
||||||
|
себя
|
||||||
|
ничего
|
||||||
|
ей
|
||||||
|
может
|
||||||
|
они
|
||||||
|
тут
|
||||||
|
где
|
||||||
|
есть
|
||||||
|
надо
|
||||||
|
ней
|
||||||
|
для
|
||||||
|
мы
|
||||||
|
тебя
|
||||||
|
их
|
||||||
|
чем
|
||||||
|
была
|
||||||
|
сам
|
||||||
|
чтоб
|
||||||
|
без
|
||||||
|
будто
|
||||||
|
чего
|
||||||
|
раз
|
||||||
|
тоже
|
||||||
|
себе
|
||||||
|
под
|
||||||
|
будет
|
||||||
|
ж
|
||||||
|
тогда
|
||||||
|
кто
|
||||||
|
этот
|
||||||
|
того
|
||||||
|
потому
|
||||||
|
этого
|
||||||
|
какой
|
||||||
|
совсем
|
||||||
|
ним
|
||||||
|
здесь
|
||||||
|
этом
|
||||||
|
один
|
||||||
|
почти
|
||||||
|
мой
|
||||||
|
тем
|
||||||
|
чтобы
|
||||||
|
нее
|
||||||
|
сейчас
|
||||||
|
были
|
||||||
|
куда
|
||||||
|
зачем
|
||||||
|
всех
|
||||||
|
никогда
|
||||||
|
можно
|
||||||
|
при
|
||||||
|
наконец
|
||||||
|
два
|
||||||
|
об
|
||||||
|
другой
|
||||||
|
хоть
|
||||||
|
после
|
||||||
|
над
|
||||||
|
больше
|
||||||
|
тот
|
||||||
|
через
|
||||||
|
эти
|
||||||
|
нас
|
||||||
|
про
|
||||||
|
всего
|
||||||
|
них
|
||||||
|
какая
|
||||||
|
много
|
||||||
|
разве
|
||||||
|
три
|
||||||
|
эту
|
||||||
|
моя
|
||||||
|
впрочем
|
||||||
|
хорошо
|
||||||
|
свою
|
||||||
|
этой
|
||||||
|
перед
|
||||||
|
иногда
|
||||||
|
лучше
|
||||||
|
чуть
|
||||||
|
том
|
||||||
|
нельзя
|
||||||
|
такой
|
||||||
|
им
|
||||||
|
более
|
||||||
|
всегда
|
||||||
|
конечно
|
||||||
|
всю
|
||||||
|
между
|
@ -82,17 +82,30 @@ insert into pg_ts_dict select
|
|||||||
'English Stemmer. Snowball.'
|
'English Stemmer. Snowball.'
|
||||||
;
|
;
|
||||||
|
|
||||||
CREATE FUNCTION snb_ru_init(internal)
|
CREATE FUNCTION snb_ru_init_koi8(internal)
|
||||||
returns internal
|
returns internal
|
||||||
as 'MODULE_PATHNAME'
|
as 'MODULE_PATHNAME'
|
||||||
language 'C';
|
language 'C';
|
||||||
|
|
||||||
insert into pg_ts_dict select
|
insert into pg_ts_dict select
|
||||||
'ru_stem',
|
'ru_stem_koi8',
|
||||||
'snb_ru_init(internal)',
|
'snb_ru_init_koi8(internal)',
|
||||||
'contrib/russian.stop',
|
'contrib/russian.stop',
|
||||||
'snb_lexize(internal,internal,int4)',
|
'snb_lexize(internal,internal,int4)',
|
||||||
'Russian Stemmer. Snowball.'
|
'Russian Stemmer. Snowball. KOI8 Encoding'
|
||||||
|
;
|
||||||
|
|
||||||
|
CREATE FUNCTION snb_ru_init_utf8(internal)
|
||||||
|
returns internal
|
||||||
|
as 'MODULE_PATHNAME'
|
||||||
|
language 'C';
|
||||||
|
|
||||||
|
insert into pg_ts_dict select
|
||||||
|
'ru_stem_utf8',
|
||||||
|
'snb_ru_init_utf8(internal)',
|
||||||
|
'contrib/russian.stop.utf8',
|
||||||
|
'snb_lexize(internal,internal,int4)',
|
||||||
|
'Russian Stemmer. Snowball. UTF8 Encoding'
|
||||||
;
|
;
|
||||||
|
|
||||||
CREATE FUNCTION spell_init(internal)
|
CREATE FUNCTION spell_init(internal)
|
||||||
@ -270,6 +283,7 @@ CREATE FUNCTION show_curcfg()
|
|||||||
|
|
||||||
insert into pg_ts_cfg values ('default', 'default','C');
|
insert into pg_ts_cfg values ('default', 'default','C');
|
||||||
insert into pg_ts_cfg values ('default_russian', 'default','ru_RU.KOI8-R');
|
insert into pg_ts_cfg values ('default_russian', 'default','ru_RU.KOI8-R');
|
||||||
|
insert into pg_ts_cfg values ('utf8_russian', 'default','ru_RU.UTF-8');
|
||||||
insert into pg_ts_cfg values ('simple', 'default');
|
insert into pg_ts_cfg values ('simple', 'default');
|
||||||
|
|
||||||
insert into pg_ts_cfgmap values ('default', 'lword', '{en_stem}');
|
insert into pg_ts_cfgmap values ('default', 'lword', '{en_stem}');
|
||||||
@ -292,24 +306,43 @@ insert into pg_ts_cfgmap values ('default', 'float', '{simple}');
|
|||||||
insert into pg_ts_cfgmap values ('default', 'int', '{simple}');
|
insert into pg_ts_cfgmap values ('default', 'int', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default', 'uint', '{simple}');
|
insert into pg_ts_cfgmap values ('default', 'uint', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'lword', '{en_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'lword', '{en_stem}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'nlword', '{ru_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'nlword', '{ru_stem_koi8}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'word', '{ru_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'word', '{ru_stem_koi8}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'email', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'email', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'url', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'url', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'host', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'host', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'sfloat', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'sfloat', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'version', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'version', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'part_hword', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'part_hword', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'nlpart_hword', '{ru_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'nlpart_hword', '{ru_stem_koi8}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'lpart_hword', '{en_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'lpart_hword', '{en_stem}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'hword', '{ru_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'hword', '{ru_stem_koi8}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'lhword', '{en_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'lhword', '{en_stem}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'nlhword', '{ru_stem}');
|
insert into pg_ts_cfgmap values ('default_russian', 'nlhword', '{ru_stem_koi8}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'uri', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'uri', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'file', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'file', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'float', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'float', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'int', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'int', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('default_russian', 'uint', '{simple}');
|
insert into pg_ts_cfgmap values ('default_russian', 'uint', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'lword', '{en_stem}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'nlword', '{ru_stem_utf8}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'word', '{ru_stem_utf8}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'email', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'url', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'host', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'sfloat', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'version', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'part_hword', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'nlpart_hword', '{ru_stem_utf8}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'lpart_hword', '{en_stem}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'hword', '{ru_stem_utf8}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'lhword', '{en_stem}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'nlhword', '{ru_stem_utf8}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'uri', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'file', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'float', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'int', '{simple}');
|
||||||
|
insert into pg_ts_cfgmap values ('utf8_russian', 'uint', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('simple', 'lword', '{simple}');
|
insert into pg_ts_cfgmap values ('simple', 'lword', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('simple', 'nlword', '{simple}');
|
insert into pg_ts_cfgmap values ('simple', 'nlword', '{simple}');
|
||||||
insert into pg_ts_cfgmap values ('simple', 'word', '{simple}');
|
insert into pg_ts_cfgmap values ('simple', 'word', '{simple}');
|
||||||
|
Loading…
x
Reference in New Issue
Block a user