X-Git-Url: https://git.mdrn.pl/pylucene.git/blobdiff_plain/a2e61f0c04805cfcb8706176758d1283c7e3a55c..aaeed5504b982cf3545252ab528713250aa33eed:/lucene-java-3.4.0/lucene/contrib/analyzers/common/src/java/org/tartarus/snowball/ext/RussianStemmer.java?ds=sidebyside diff --git a/lucene-java-3.4.0/lucene/contrib/analyzers/common/src/java/org/tartarus/snowball/ext/RussianStemmer.java b/lucene-java-3.4.0/lucene/contrib/analyzers/common/src/java/org/tartarus/snowball/ext/RussianStemmer.java deleted file mode 100644 index fad1835..0000000 --- a/lucene-java-3.4.0/lucene/contrib/analyzers/common/src/java/org/tartarus/snowball/ext/RussianStemmer.java +++ /dev/null @@ -1,727 +0,0 @@ -// This file was generated automatically by the Snowball to Java compiler - -package org.tartarus.snowball.ext; -import org.tartarus.snowball.SnowballProgram; -import org.tartarus.snowball.Among; - -/** - * Generated class implementing code defined by a snowball script. - */ -public class RussianStemmer extends SnowballProgram { - - private Among a_0[] = { - new Among ( "\u0432", -1, 1, "", this), - new Among ( "\u0438\u0432", 0, 2, "", this), - new Among ( "\u044B\u0432", 0, 2, "", this), - new Among ( "\u0432\u0448\u0438", -1, 1, "", this), - new Among ( "\u0438\u0432\u0448\u0438", 3, 2, "", this), - new Among ( "\u044B\u0432\u0448\u0438", 3, 2, "", this), - new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, "", this), - new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, "", this), - new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, "", this) - }; - - private Among a_1[] = { - new Among ( "\u0435\u0435", -1, 1, "", this), - new Among ( "\u0438\u0435", -1, 1, "", this), - new Among ( "\u043E\u0435", -1, 1, "", this), - new Among ( "\u044B\u0435", -1, 1, "", this), - new Among ( "\u0438\u043C\u0438", -1, 1, "", this), - new Among ( "\u044B\u043C\u0438", -1, 1, "", this), - new Among ( "\u0435\u0439", -1, 1, "", this), - new Among ( "\u0438\u0439", -1, 1, "", this), - new Among ( "\u043E\u0439", -1, 1, "", this), - new Among ( "\u044B\u0439", -1, 1, "", this), - new Among ( "\u0435\u043C", -1, 1, "", this), - new Among ( "\u0438\u043C", -1, 1, "", this), - new Among ( "\u043E\u043C", -1, 1, "", this), - new Among ( "\u044B\u043C", -1, 1, "", this), - new Among ( "\u0435\u0433\u043E", -1, 1, "", this), - new Among ( "\u043E\u0433\u043E", -1, 1, "", this), - new Among ( "\u0435\u043C\u0443", -1, 1, "", this), - new Among ( "\u043E\u043C\u0443", -1, 1, "", this), - new Among ( "\u0438\u0445", -1, 1, "", this), - new Among ( "\u044B\u0445", -1, 1, "", this), - new Among ( "\u0435\u044E", -1, 1, "", this), - new Among ( "\u043E\u044E", -1, 1, "", this), - new Among ( "\u0443\u044E", -1, 1, "", this), - new Among ( "\u044E\u044E", -1, 1, "", this), - new Among ( "\u0430\u044F", -1, 1, "", this), - new Among ( "\u044F\u044F", -1, 1, "", this) - }; - - private Among a_2[] = { - new Among ( "\u0435\u043C", -1, 1, "", this), - new Among ( "\u043D\u043D", -1, 1, "", this), - new Among ( "\u0432\u0448", -1, 1, "", this), - new Among ( "\u0438\u0432\u0448", 2, 2, "", this), - new Among ( "\u044B\u0432\u0448", 2, 2, "", this), - new Among ( "\u0449", -1, 1, "", this), - new Among ( "\u044E\u0449", 5, 1, "", this), - new Among ( "\u0443\u044E\u0449", 6, 2, "", this) - }; - - private Among a_3[] = { - new Among ( "\u0441\u044C", -1, 1, "", this), - new Among ( "\u0441\u044F", -1, 1, "", this) - }; - - private Among a_4[] = { - new Among ( "\u043B\u0430", -1, 1, "", this), - new Among ( "\u0438\u043B\u0430", 0, 2, "", this), - new Among ( "\u044B\u043B\u0430", 0, 2, "", this), - new Among ( "\u043D\u0430", -1, 1, "", this), - new Among ( "\u0435\u043D\u0430", 3, 2, "", this), - new Among ( "\u0435\u0442\u0435", -1, 1, "", this), - new Among ( "\u0438\u0442\u0435", -1, 2, "", this), - new Among ( "\u0439\u0442\u0435", -1, 1, "", this), - new Among ( "\u0435\u0439\u0442\u0435", 7, 2, "", this), - new Among ( "\u0443\u0439\u0442\u0435", 7, 2, "", this), - new Among ( "\u043B\u0438", -1, 1, "", this), - new Among ( "\u0438\u043B\u0438", 10, 2, "", this), - new Among ( "\u044B\u043B\u0438", 10, 2, "", this), - new Among ( "\u0439", -1, 1, "", this), - new Among ( "\u0435\u0439", 13, 2, "", this), - new Among ( "\u0443\u0439", 13, 2, "", this), - new Among ( "\u043B", -1, 1, "", this), - new Among ( "\u0438\u043B", 16, 2, "", this), - new Among ( "\u044B\u043B", 16, 2, "", this), - new Among ( "\u0435\u043C", -1, 1, "", this), - new Among ( "\u0438\u043C", -1, 2, "", this), - new Among ( "\u044B\u043C", -1, 2, "", this), - new Among ( "\u043D", -1, 1, "", this), - new Among ( "\u0435\u043D", 22, 2, "", this), - new Among ( "\u043B\u043E", -1, 1, "", this), - new Among ( "\u0438\u043B\u043E", 24, 2, "", this), - new Among ( "\u044B\u043B\u043E", 24, 2, "", this), - new Among ( "\u043D\u043E", -1, 1, "", this), - new Among ( "\u0435\u043D\u043E", 27, 2, "", this), - new Among ( "\u043D\u043D\u043E", 27, 1, "", this), - new Among ( "\u0435\u0442", -1, 1, "", this), - new Among ( "\u0443\u0435\u0442", 30, 2, "", this), - new Among ( "\u0438\u0442", -1, 2, "", this), - new Among ( "\u044B\u0442", -1, 2, "", this), - new Among ( "\u044E\u0442", -1, 1, "", this), - new Among ( "\u0443\u044E\u0442", 34, 2, "", this), - new Among ( "\u044F\u0442", -1, 2, "", this), - new Among ( "\u043D\u044B", -1, 1, "", this), - new Among ( "\u0435\u043D\u044B", 37, 2, "", this), - new Among ( "\u0442\u044C", -1, 1, "", this), - new Among ( "\u0438\u0442\u044C", 39, 2, "", this), - new Among ( "\u044B\u0442\u044C", 39, 2, "", this), - new Among ( "\u0435\u0448\u044C", -1, 1, "", this), - new Among ( "\u0438\u0448\u044C", -1, 2, "", this), - new Among ( "\u044E", -1, 2, "", this), - new Among ( "\u0443\u044E", 44, 2, "", this) - }; - - private Among a_5[] = { - new Among ( "\u0430", -1, 1, "", this), - new Among ( "\u0435\u0432", -1, 1, "", this), - new Among ( "\u043E\u0432", -1, 1, "", this), - new Among ( "\u0435", -1, 1, "", this), - new Among ( "\u0438\u0435", 3, 1, "", this), - new Among ( "\u044C\u0435", 3, 1, "", this), - new Among ( "\u0438", -1, 1, "", this), - new Among ( "\u0435\u0438", 6, 1, "", this), - new Among ( "\u0438\u0438", 6, 1, "", this), - new Among ( "\u0430\u043C\u0438", 6, 1, "", this), - new Among ( "\u044F\u043C\u0438", 6, 1, "", this), - new Among ( "\u0438\u044F\u043C\u0438", 10, 1, "", this), - new Among ( "\u0439", -1, 1, "", this), - new Among ( "\u0435\u0439", 12, 1, "", this), - new Among ( "\u0438\u0435\u0439", 13, 1, "", this), - new Among ( "\u0438\u0439", 12, 1, "", this), - new Among ( "\u043E\u0439", 12, 1, "", this), - new Among ( "\u0430\u043C", -1, 1, "", this), - new Among ( "\u0435\u043C", -1, 1, "", this), - new Among ( "\u0438\u0435\u043C", 18, 1, "", this), - new Among ( "\u043E\u043C", -1, 1, "", this), - new Among ( "\u044F\u043C", -1, 1, "", this), - new Among ( "\u0438\u044F\u043C", 21, 1, "", this), - new Among ( "\u043E", -1, 1, "", this), - new Among ( "\u0443", -1, 1, "", this), - new Among ( "\u0430\u0445", -1, 1, "", this), - new Among ( "\u044F\u0445", -1, 1, "", this), - new Among ( "\u0438\u044F\u0445", 26, 1, "", this), - new Among ( "\u044B", -1, 1, "", this), - new Among ( "\u044C", -1, 1, "", this), - new Among ( "\u044E", -1, 1, "", this), - new Among ( "\u0438\u044E", 30, 1, "", this), - new Among ( "\u044C\u044E", 30, 1, "", this), - new Among ( "\u044F", -1, 1, "", this), - new Among ( "\u0438\u044F", 33, 1, "", this), - new Among ( "\u044C\u044F", 33, 1, "", this) - }; - - private Among a_6[] = { - new Among ( "\u043E\u0441\u0442", -1, 1, "", this), - new Among ( "\u043E\u0441\u0442\u044C", -1, 1, "", this) - }; - - private Among a_7[] = { - new Among ( "\u0435\u0439\u0448\u0435", -1, 1, "", this), - new Among ( "\u043D", -1, 2, "", this), - new Among ( "\u0435\u0439\u0448", -1, 1, "", this), - new Among ( "\u044C", -1, 3, "", this) - }; - - private static final char g_v[] = {33, 65, 8, 232 }; - - private int I_p2; - private int I_pV; - - private void copy_from(RussianStemmer other) { - I_p2 = other.I_p2; - I_pV = other.I_pV; - super.copy_from(other); - } - - private boolean r_mark_regions() { - int v_1; - // (, line 57 - I_pV = limit; - I_p2 = limit; - // do, line 61 - v_1 = cursor; - lab0: do { - // (, line 61 - // gopast, line 62 - golab1: while(true) - { - lab2: do { - if (!(in_grouping(g_v, 1072, 1103))) - { - break lab2; - } - break golab1; - } while (false); - if (cursor >= limit) - { - break lab0; - } - cursor++; - } - // setmark pV, line 62 - I_pV = cursor; - // gopast, line 62 - golab3: while(true) - { - lab4: do { - if (!(out_grouping(g_v, 1072, 1103))) - { - break lab4; - } - break golab3; - } while (false); - if (cursor >= limit) - { - break lab0; - } - cursor++; - } - // gopast, line 63 - golab5: while(true) - { - lab6: do { - if (!(in_grouping(g_v, 1072, 1103))) - { - break lab6; - } - break golab5; - } while (false); - if (cursor >= limit) - { - break lab0; - } - cursor++; - } - // gopast, line 63 - golab7: while(true) - { - lab8: do { - if (!(out_grouping(g_v, 1072, 1103))) - { - break lab8; - } - break golab7; - } while (false); - if (cursor >= limit) - { - break lab0; - } - cursor++; - } - // setmark p2, line 63 - I_p2 = cursor; - } while (false); - cursor = v_1; - return true; - } - - private boolean r_R2() { - if (!(I_p2 <= cursor)) - { - return false; - } - return true; - } - - private boolean r_perfective_gerund() { - int among_var; - int v_1; - // (, line 71 - // [, line 72 - ket = cursor; - // substring, line 72 - among_var = find_among_b(a_0, 9); - if (among_var == 0) - { - return false; - } - // ], line 72 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 76 - // or, line 76 - lab0: do { - v_1 = limit - cursor; - lab1: do { - // literal, line 76 - if (!(eq_s_b(1, "\u0430"))) - { - break lab1; - } - break lab0; - } while (false); - cursor = limit - v_1; - // literal, line 76 - if (!(eq_s_b(1, "\u044F"))) - { - return false; - } - } while (false); - // delete, line 76 - slice_del(); - break; - case 2: - // (, line 83 - // delete, line 83 - slice_del(); - break; - } - return true; - } - - private boolean r_adjective() { - int among_var; - // (, line 87 - // [, line 88 - ket = cursor; - // substring, line 88 - among_var = find_among_b(a_1, 26); - if (among_var == 0) - { - return false; - } - // ], line 88 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 97 - // delete, line 97 - slice_del(); - break; - } - return true; - } - - private boolean r_adjectival() { - int among_var; - int v_1; - int v_2; - // (, line 101 - // call adjective, line 102 - if (!r_adjective()) - { - return false; - } - // try, line 109 - v_1 = limit - cursor; - lab0: do { - // (, line 109 - // [, line 110 - ket = cursor; - // substring, line 110 - among_var = find_among_b(a_2, 8); - if (among_var == 0) - { - cursor = limit - v_1; - break lab0; - } - // ], line 110 - bra = cursor; - switch(among_var) { - case 0: - cursor = limit - v_1; - break lab0; - case 1: - // (, line 115 - // or, line 115 - lab1: do { - v_2 = limit - cursor; - lab2: do { - // literal, line 115 - if (!(eq_s_b(1, "\u0430"))) - { - break lab2; - } - break lab1; - } while (false); - cursor = limit - v_2; - // literal, line 115 - if (!(eq_s_b(1, "\u044F"))) - { - cursor = limit - v_1; - break lab0; - } - } while (false); - // delete, line 115 - slice_del(); - break; - case 2: - // (, line 122 - // delete, line 122 - slice_del(); - break; - } - } while (false); - return true; - } - - private boolean r_reflexive() { - int among_var; - // (, line 128 - // [, line 129 - ket = cursor; - // substring, line 129 - among_var = find_among_b(a_3, 2); - if (among_var == 0) - { - return false; - } - // ], line 129 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 132 - // delete, line 132 - slice_del(); - break; - } - return true; - } - - private boolean r_verb() { - int among_var; - int v_1; - // (, line 136 - // [, line 137 - ket = cursor; - // substring, line 137 - among_var = find_among_b(a_4, 46); - if (among_var == 0) - { - return false; - } - // ], line 137 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 143 - // or, line 143 - lab0: do { - v_1 = limit - cursor; - lab1: do { - // literal, line 143 - if (!(eq_s_b(1, "\u0430"))) - { - break lab1; - } - break lab0; - } while (false); - cursor = limit - v_1; - // literal, line 143 - if (!(eq_s_b(1, "\u044F"))) - { - return false; - } - } while (false); - // delete, line 143 - slice_del(); - break; - case 2: - // (, line 151 - // delete, line 151 - slice_del(); - break; - } - return true; - } - - private boolean r_noun() { - int among_var; - // (, line 159 - // [, line 160 - ket = cursor; - // substring, line 160 - among_var = find_among_b(a_5, 36); - if (among_var == 0) - { - return false; - } - // ], line 160 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 167 - // delete, line 167 - slice_del(); - break; - } - return true; - } - - private boolean r_derivational() { - int among_var; - // (, line 175 - // [, line 176 - ket = cursor; - // substring, line 176 - among_var = find_among_b(a_6, 2); - if (among_var == 0) - { - return false; - } - // ], line 176 - bra = cursor; - // call R2, line 176 - if (!r_R2()) - { - return false; - } - switch(among_var) { - case 0: - return false; - case 1: - // (, line 179 - // delete, line 179 - slice_del(); - break; - } - return true; - } - - private boolean r_tidy_up() { - int among_var; - // (, line 183 - // [, line 184 - ket = cursor; - // substring, line 184 - among_var = find_among_b(a_7, 4); - if (among_var == 0) - { - return false; - } - // ], line 184 - bra = cursor; - switch(among_var) { - case 0: - return false; - case 1: - // (, line 188 - // delete, line 188 - slice_del(); - // [, line 189 - ket = cursor; - // literal, line 189 - if (!(eq_s_b(1, "\u043D"))) - { - return false; - } - // ], line 189 - bra = cursor; - // literal, line 189 - if (!(eq_s_b(1, "\u043D"))) - { - return false; - } - // delete, line 189 - slice_del(); - break; - case 2: - // (, line 192 - // literal, line 192 - if (!(eq_s_b(1, "\u043D"))) - { - return false; - } - // delete, line 192 - slice_del(); - break; - case 3: - // (, line 194 - // delete, line 194 - slice_del(); - break; - } - return true; - } - - public boolean stem() { - int v_1; - int v_2; - int v_3; - int v_4; - int v_5; - int v_6; - int v_7; - int v_8; - int v_9; - int v_10; - // (, line 199 - // do, line 201 - v_1 = cursor; - lab0: do { - // call mark_regions, line 201 - if (!r_mark_regions()) - { - break lab0; - } - } while (false); - cursor = v_1; - // backwards, line 202 - limit_backward = cursor; cursor = limit; - // setlimit, line 202 - v_2 = limit - cursor; - // tomark, line 202 - if (cursor < I_pV) - { - return false; - } - cursor = I_pV; - v_3 = limit_backward; - limit_backward = cursor; - cursor = limit - v_2; - // (, line 202 - // do, line 203 - v_4 = limit - cursor; - lab1: do { - // (, line 203 - // or, line 204 - lab2: do { - v_5 = limit - cursor; - lab3: do { - // call perfective_gerund, line 204 - if (!r_perfective_gerund()) - { - break lab3; - } - break lab2; - } while (false); - cursor = limit - v_5; - // (, line 205 - // try, line 205 - v_6 = limit - cursor; - lab4: do { - // call reflexive, line 205 - if (!r_reflexive()) - { - cursor = limit - v_6; - break lab4; - } - } while (false); - // or, line 206 - lab5: do { - v_7 = limit - cursor; - lab6: do { - // call adjectival, line 206 - if (!r_adjectival()) - { - break lab6; - } - break lab5; - } while (false); - cursor = limit - v_7; - lab7: do { - // call verb, line 206 - if (!r_verb()) - { - break lab7; - } - break lab5; - } while (false); - cursor = limit - v_7; - // call noun, line 206 - if (!r_noun()) - { - break lab1; - } - } while (false); - } while (false); - } while (false); - cursor = limit - v_4; - // try, line 209 - v_8 = limit - cursor; - lab8: do { - // (, line 209 - // [, line 209 - ket = cursor; - // literal, line 209 - if (!(eq_s_b(1, "\u0438"))) - { - cursor = limit - v_8; - break lab8; - } - // ], line 209 - bra = cursor; - // delete, line 209 - slice_del(); - } while (false); - // do, line 212 - v_9 = limit - cursor; - lab9: do { - // call derivational, line 212 - if (!r_derivational()) - { - break lab9; - } - } while (false); - cursor = limit - v_9; - // do, line 213 - v_10 = limit - cursor; - lab10: do { - // call tidy_up, line 213 - if (!r_tidy_up()) - { - break lab10; - } - } while (false); - cursor = limit - v_10; - limit_backward = v_3; - cursor = limit_backward; return true; - } - -} -