1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193
|
<?xml version="1.0" encoding="utf-8"?>
<test>
<requires>
<lemmatizer_base/>
</requires>
<name>aot morphology for english and german</name>
<config>
common
{
lemmatizer_base = <local>lemmatizer_base</local>
}
searchd
{
<searchd_settings/>
workers = threads
}
source test1
{
type = mysql
<sql_settings/>
sql_query_pre = set names utf8
sql_query = select * from test_table
sql_attr_uint = gid
}
index test1
{
source = test1
path = <data_path/>/testen1
morphology = lemmatize_en_all
blend_chars = @, .
wordforms = <this_test/>/wordforms.txt
}
index test2 : test1
{
path = <data_path/>/testen2
morphology = lemmatize_en
}
index test2ruen : test2
{
path = <data_path/>/testruen2
morphology = lemmatize_en,lemmatize_ru
}
index test2red : test2
{
path = <data_path/>/testruende2
charset_table = 0..9, A..Z, a..z, _, U+C0..U+D6, U+D9..U+DF, U+E0..U+F6, U+F9..U+FF, U+410..U+42F->U+430..U+44F, U+430..U+44F
morphology = lemmatize_en,lemmatize_ru,lemmatize_de
}
index testrt1
{
type = rt
path = <data_path/>/testenrt1
morphology = lemmatize_en_all
blend_chars = @, .
wordforms = <this_test/>/wordforms.txt
rt_attr_uint = gid
rt_field = title
}
index testrt2 : testrt1
{
path = <data_path/>/testenrt2
morphology = lemmatize_en
}
index testrt2ruen : testrt2
{
path = <data_path/>/testruenrt2
morphology = lemmatize_en,lemmatize_ru
}
index testrt2red : testrt2
{
path = <data_path/>/testred2
charset_table = 0..9, A..Z, a..z, _, U+C0..U+D6, U+D9..U+DF, U+E0..U+F6, U+F9..U+FF, U+410..U+42F->U+430..U+44F, U+430..U+44F
morphology = lemmatize_en,lemmatize_ru,lemmatize_de
}
index aot_plain
{
source = test1
path = <data_path/>/aot_plain
docinfo = extern
morphology = lemmatize_ru_all
blend_chars = .
}
index aot_exact
{
source = test1
path = <data_path/>/aot_exact
docinfo = extern
morphology = lemmatize_ru_all
blend_chars = .
index_exact_words = 1
min_prefix_len = 1
index_field_lengths = 1
morphology = stem_en, lemmatize_ru_all
}
</config>
<metaindex name='META:rt'>
<index>testrt1</index>
<index>testrt2</index>
<index>testrt2ruen</index>
<index>testrt2red</index>
</metaindex>
<metaindex name='META:all'>
<index>test1</index>
<index>test2</index>
<index>test2ruen</index>
<index>testrt1</index>
<index>testrt2</index>
<index>testrt2ruen</index>
<index>testrt2red</index>
</metaindex>
<metaindex name='META:aot'>
<index>aot_plain</index>
<index>aot_exact</index>
</metaindex>
<db_create>
CREATE TABLE test_table
(
id INTEGER PRIMARY KEY NOT NULL,
gid INTEGER NOT NULL,
title VARCHAR(255) CHARACTER SET utf8 NOT NULL
);
</db_create>
<db_drop>DROP TABLE IF EXISTS test_table</db_drop>
<db_insert>SET NAMES utf8</db_insert>
<db_insert>INSERT INTO test_table VALUES
( 1, 11, 'wives and men' ),
( 2, 11, 'wife and man' ),
( 3, 11, 'children and women' ),
( 4, 11, 'child and woman' ),
( 5, 11, 'as it become known' ),
( 6, 11, 'somebody indices' ),
( 7, 11, 'nobody@nowhere knew everything super' ),
( 8, 11, 'стали well-known как путин markieren' )
</db_insert>
<sphqueries>
<sphinxql>INSERT INTO META:rt VALUES ( 1, 'wives and men', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 2, 'wife and man', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 3, 'children and women', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 4, 'child and woman', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 5, 'as it become known', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 6, 'somebody indices', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 7, 'nobody@nowhere knew everything super', 11 )</sphinxql>
<sphinxql>INSERT INTO META:rt VALUES ( 8, 'стали well-known как путин markieren', 11 )</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('wife'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('wives'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('man'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('men'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('super'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('puper'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('"child and woman"'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('"children and women"'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('nobody@nowhere knows'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('путина knew стали'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('путин стал knows'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('путина markierte'); SHOW META</sphinxql>
<sphinxql>SELECT * FROM META:all WHERE MATCH('knew markierte'); SHOW META</sphinxql>
<!-- regressoin aot lemmas at excerpt -->
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', 'молоком', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', '=молоком', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', 'молоко', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', '=молоко', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', '=молока', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молочная ферма', 'META:aot', 'молок*', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('молоко такое же молока и так же молоком но не ком', 'META:aot', 'мол*', 1 as query_mode)</sphinxql>
<sphinxql>CALL SNIPPETS ('много стресса. от багов.', 'META:aot', 'стресс', 1 as query_mode)</sphinxql>
</sphqueries>
</test>
|