// CHECKSTYLE:OFF /* Copyright (c) 2001, Dr Martin Porter Copyright (c) 2002, Richard Boulton All rights reserved. Redistribution and use in source and binary forms, with or without modification, are permitted provided that the following conditions are met: * Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * Redistributions in binary form must reproduce the above copyright * notice, this list of conditions and the following disclaimer in the * documentation and/or other materials provided with the distribution. * Neither the name of the copyright holders nor the names of its contributors * may be used to endorse or promote products derived from this software * without specific prior written permission. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ // This file was generated automatically by the Snowball to Java compiler package opennlp.tools.stemmer.snowball; /** * This class was automatically generated by a Snowball to Java compiler * It implements the stemming algorithm defined by a snowball script. */ class russianStemmer extends opennlp.tools.stemmer.snowball.AbstractSnowballStemmer { private static final long serialVersionUID = 1L; private final static russianStemmer methodObject = new russianStemmer (); private final static Among a_0[] = { new Among ( "\u0432", -1, 1, "", methodObject ), new Among ( "\u0438\u0432", 0, 2, "", methodObject ), new Among ( "\u044B\u0432", 0, 2, "", methodObject ), new Among ( "\u0432\u0448\u0438", -1, 1, "", methodObject ), new Among ( "\u0438\u0432\u0448\u0438", 3, 2, "", methodObject ), new Among ( "\u044B\u0432\u0448\u0438", 3, 2, "", methodObject ), new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, "", methodObject ), new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject ), new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject ) }; private final static Among a_1[] = { new Among ( "\u0435\u0435", -1, 1, "", methodObject ), new Among ( "\u0438\u0435", -1, 1, "", methodObject ), new Among ( "\u043E\u0435", -1, 1, "", methodObject ), new Among ( "\u044B\u0435", -1, 1, "", methodObject ), new Among ( "\u0438\u043C\u0438", -1, 1, "", methodObject ), new Among ( "\u044B\u043C\u0438", -1, 1, "", methodObject ), new Among ( "\u0435\u0439", -1, 1, "", methodObject ), new Among ( "\u0438\u0439", -1, 1, "", methodObject ), new Among ( "\u043E\u0439", -1, 1, "", methodObject ), new Among ( "\u044B\u0439", -1, 1, "", methodObject ), new Among ( "\u0435\u043C", -1, 1, "", methodObject ), new Among ( "\u0438\u043C", -1, 1, "", methodObject ), new Among ( "\u043E\u043C", -1, 1, "", methodObject ), new Among ( "\u044B\u043C", -1, 1, "", methodObject ), new Among ( "\u0435\u0433\u043E", -1, 1, "", methodObject ), new Among ( "\u043E\u0433\u043E", -1, 1, "", methodObject ), new Among ( "\u0435\u043C\u0443", -1, 1, "", methodObject ), new Among ( "\u043E\u043C\u0443", -1, 1, "", methodObject ), new Among ( "\u0438\u0445", -1, 1, "", methodObject ), new Among ( "\u044B\u0445", -1, 1, "", methodObject ), new Among ( "\u0435\u044E", -1, 1, "", methodObject ), new Among ( "\u043E\u044E", -1, 1, "", methodObject ), new Among ( "\u0443\u044E", -1, 1, "", methodObject ), new Among ( "\u044E\u044E", -1, 1, "", methodObject ), new Among ( "\u0430\u044F", -1, 1, "", methodObject ), new Among ( "\u044F\u044F", -1, 1, "", methodObject ) }; private final static Among a_2[] = { new Among ( "\u0435\u043C", -1, 1, "", methodObject ), new Among ( "\u043D\u043D", -1, 1, "", methodObject ), new Among ( "\u0432\u0448", -1, 1, "", methodObject ), new Among ( "\u0438\u0432\u0448", 2, 2, "", methodObject ), new Among ( "\u044B\u0432\u0448", 2, 2, "", methodObject ), new Among ( "\u0449", -1, 1, "", methodObject ), new Among ( "\u044E\u0449", 5, 1, "", methodObject ), new Among ( "\u0443\u044E\u0449", 6, 2, "", methodObject ) }; private final static Among a_3[] = { new Among ( "\u0441\u044C", -1, 1, "", methodObject ), new Among ( "\u0441\u044F", -1, 1, "", methodObject ) }; private final static Among a_4[] = { new Among ( "\u043B\u0430", -1, 1, "", methodObject ), new Among ( "\u0438\u043B\u0430", 0, 2, "", methodObject ), new Among ( "\u044B\u043B\u0430", 0, 2, "", methodObject ), new Among ( "\u043D\u0430", -1, 1, "", methodObject ), new Among ( "\u0435\u043D\u0430", 3, 2, "", methodObject ), new Among ( "\u0435\u0442\u0435", -1, 1, "", methodObject ), new Among ( "\u0438\u0442\u0435", -1, 2, "", methodObject ), new Among ( "\u0439\u0442\u0435", -1, 1, "", methodObject ), new Among ( "\u0435\u0439\u0442\u0435", 7, 2, "", methodObject ), new Among ( "\u0443\u0439\u0442\u0435", 7, 2, "", methodObject ), new Among ( "\u043B\u0438", -1, 1, "", methodObject ), new Among ( "\u0438\u043B\u0438", 10, 2, "", methodObject ), new Among ( "\u044B\u043B\u0438", 10, 2, "", methodObject ), new Among ( "\u0439", -1, 1, "", methodObject ), new Among ( "\u0435\u0439", 13, 2, "", methodObject ), new Among ( "\u0443\u0439", 13, 2, "", methodObject ), new Among ( "\u043B", -1, 1, "", methodObject ), new Among ( "\u0438\u043B", 16, 2, "", methodObject ), new Among ( "\u044B\u043B", 16, 2, "", methodObject ), new Among ( "\u0435\u043C", -1, 1, "", methodObject ), new Among ( "\u0438\u043C", -1, 2, "", methodObject ), new Among ( "\u044B\u043C", -1, 2, "", methodObject ), new Among ( "\u043D", -1, 1, "", methodObject ), new Among ( "\u0435\u043D", 22, 2, "", methodObject ), new Among ( "\u043B\u043E", -1, 1, "", methodObject ), new Among ( "\u0438\u043B\u043E", 24, 2, "", methodObject ), new Among ( "\u044B\u043B\u043E", 24, 2, "", methodObject ), new Among ( "\u043D\u043E", -1, 1, "", methodObject ), new Among ( "\u0435\u043D\u043E", 27, 2, "", methodObject ), new Among ( "\u043D\u043D\u043E", 27, 1, "", methodObject ), new Among ( "\u0435\u0442", -1, 1, "", methodObject ), new Among ( "\u0443\u0435\u0442", 30, 2, "", methodObject ), new Among ( "\u0438\u0442", -1, 2, "", methodObject ), new Among ( "\u044B\u0442", -1, 2, "", methodObject ), new Among ( "\u044E\u0442", -1, 1, "", methodObject ), new Among ( "\u0443\u044E\u0442", 34, 2, "", methodObject ), new Among ( "\u044F\u0442", -1, 2, "", methodObject ), new Among ( "\u043D\u044B", -1, 1, "", methodObject ), new Among ( "\u0435\u043D\u044B", 37, 2, "", methodObject ), new Among ( "\u0442\u044C", -1, 1, "", methodObject ), new Among ( "\u0438\u0442\u044C", 39, 2, "", methodObject ), new Among ( "\u044B\u0442\u044C", 39, 2, "", methodObject ), new Among ( "\u0435\u0448\u044C", -1, 1, "", methodObject ), new Among ( "\u0438\u0448\u044C", -1, 2, "", methodObject ), new Among ( "\u044E", -1, 2, "", methodObject ), new Among ( "\u0443\u044E", 44, 2, "", methodObject ) }; private final static Among a_5[] = { new Among ( "\u0430", -1, 1, "", methodObject ), new Among ( "\u0435\u0432", -1, 1, "", methodObject ), new Among ( "\u043E\u0432", -1, 1, "", methodObject ), new Among ( "\u0435", -1, 1, "", methodObject ), new Among ( "\u0438\u0435", 3, 1, "", methodObject ), new Among ( "\u044C\u0435", 3, 1, "", methodObject ), new Among ( "\u0438", -1, 1, "", methodObject ), new Among ( "\u0435\u0438", 6, 1, "", methodObject ), new Among ( "\u0438\u0438", 6, 1, "", methodObject ), new Among ( "\u0430\u043C\u0438", 6, 1, "", methodObject ), new Among ( "\u044F\u043C\u0438", 6, 1, "", methodObject ), new Among ( "\u0438\u044F\u043C\u0438", 10, 1, "", methodObject ), new Among ( "\u0439", -1, 1, "", methodObject ), new Among ( "\u0435\u0439", 12, 1, "", methodObject ), new Among ( "\u0438\u0435\u0439", 13, 1, "", methodObject ), new Among ( "\u0438\u0439", 12, 1, "", methodObject ), new Among ( "\u043E\u0439", 12, 1, "", methodObject ), new Among ( "\u0430\u043C", -1, 1, "", methodObject ), new Among ( "\u0435\u043C", -1, 1, "", methodObject ), new Among ( "\u0438\u0435\u043C", 18, 1, "", methodObject ), new Among ( "\u043E\u043C", -1, 1, "", methodObject ), new Among ( "\u044F\u043C", -1, 1, "", methodObject ), new Among ( "\u0438\u044F\u043C", 21, 1, "", methodObject ), new Among ( "\u043E", -1, 1, "", methodObject ), new Among ( "\u0443", -1, 1, "", methodObject ), new Among ( "\u0430\u0445", -1, 1, "", methodObject ), new Among ( "\u044F\u0445", -1, 1, "", methodObject ), new Among ( "\u0438\u044F\u0445", 26, 1, "", methodObject ), new Among ( "\u044B", -1, 1, "", methodObject ), new Among ( "\u044C", -1, 1, "", methodObject ), new Among ( "\u044E", -1, 1, "", methodObject ), new Among ( "\u0438\u044E", 30, 1, "", methodObject ), new Among ( "\u044C\u044E", 30, 1, "", methodObject ), new Among ( "\u044F", -1, 1, "", methodObject ), new Among ( "\u0438\u044F", 33, 1, "", methodObject ), new Among ( "\u044C\u044F", 33, 1, "", methodObject ) }; private final static Among a_6[] = { new Among ( "\u043E\u0441\u0442", -1, 1, "", methodObject ), new Among ( "\u043E\u0441\u0442\u044C", -1, 1, "", methodObject ) }; private final static Among a_7[] = { new Among ( "\u0435\u0439\u0448\u0435", -1, 1, "", methodObject ), new Among ( "\u043D", -1, 2, "", methodObject ), new Among ( "\u0435\u0439\u0448", -1, 1, "", methodObject ), new Among ( "\u044C", -1, 3, "", methodObject ) }; private static final char g_v[] = {33, 65, 8, 232 }; private int I_p2; private int I_pV; private void copy_from(russianStemmer other) { I_p2 = other.I_p2; I_pV = other.I_pV; super.copy_from(other); } private boolean r_mark_regions() { int v_1; // (, line 57 I_pV = limit; I_p2 = limit; // do, line 61 v_1 = cursor; lab0: do { // (, line 61 // gopast, line 62 golab1: while(true) { lab2: do { if (!(in_grouping(g_v, 1072, 1103))) { break lab2; } break golab1; } while (false); if (cursor >= limit) { break lab0; } cursor++; } // setmark pV, line 62 I_pV = cursor; // gopast, line 62 golab3: while(true) { lab4: do { if (!(out_grouping(g_v, 1072, 1103))) { break lab4; } break golab3; } while (false); if (cursor >= limit) { break lab0; } cursor++; } // gopast, line 63 golab5: while(true) { lab6: do { if (!(in_grouping(g_v, 1072, 1103))) { break lab6; } break golab5; } while (false); if (cursor >= limit) { break lab0; } cursor++; } // gopast, line 63 golab7: while(true) { lab8: do { if (!(out_grouping(g_v, 1072, 1103))) { break lab8; } break golab7; } while (false); if (cursor >= limit) { break lab0; } cursor++; } // setmark p2, line 63 I_p2 = cursor; } while (false); cursor = v_1; return true; } private boolean r_R2() { if (!(I_p2 <= cursor)) { return false; } return true; } private boolean r_perfective_gerund() { int among_var; int v_1; // (, line 71 // [, line 72 ket = cursor; // substring, line 72 among_var = find_among_b(a_0, 9); if (among_var == 0) { return false; } // ], line 72 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 76 // or, line 76 lab0: do { v_1 = limit - cursor; lab1: do { // literal, line 76 if (!(eq_s_b(1, "\u0430"))) { break lab1; } break lab0; } while (false); cursor = limit - v_1; // literal, line 76 if (!(eq_s_b(1, "\u044F"))) { return false; } } while (false); // delete, line 76 slice_del(); break; case 2: // (, line 83 // delete, line 83 slice_del(); break; } return true; } private boolean r_adjective() { int among_var; // (, line 87 // [, line 88 ket = cursor; // substring, line 88 among_var = find_among_b(a_1, 26); if (among_var == 0) { return false; } // ], line 88 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 97 // delete, line 97 slice_del(); break; } return true; } private boolean r_adjectival() { int among_var; int v_1; int v_2; // (, line 101 // call adjective, line 102 if (!r_adjective()) { return false; } // try, line 109 v_1 = limit - cursor; lab0: do { // (, line 109 // [, line 110 ket = cursor; // substring, line 110 among_var = find_among_b(a_2, 8); if (among_var == 0) { cursor = limit - v_1; break lab0; } // ], line 110 bra = cursor; switch(among_var) { case 0: cursor = limit - v_1; break lab0; case 1: // (, line 115 // or, line 115 lab1: do { v_2 = limit - cursor; lab2: do { // literal, line 115 if (!(eq_s_b(1, "\u0430"))) { break lab2; } break lab1; } while (false); cursor = limit - v_2; // literal, line 115 if (!(eq_s_b(1, "\u044F"))) { cursor = limit - v_1; break lab0; } } while (false); // delete, line 115 slice_del(); break; case 2: // (, line 122 // delete, line 122 slice_del(); break; } } while (false); return true; } private boolean r_reflexive() { int among_var; // (, line 128 // [, line 129 ket = cursor; // substring, line 129 among_var = find_among_b(a_3, 2); if (among_var == 0) { return false; } // ], line 129 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 132 // delete, line 132 slice_del(); break; } return true; } private boolean r_verb() { int among_var; int v_1; // (, line 136 // [, line 137 ket = cursor; // substring, line 137 among_var = find_among_b(a_4, 46); if (among_var == 0) { return false; } // ], line 137 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 143 // or, line 143 lab0: do { v_1 = limit - cursor; lab1: do { // literal, line 143 if (!(eq_s_b(1, "\u0430"))) { break lab1; } break lab0; } while (false); cursor = limit - v_1; // literal, line 143 if (!(eq_s_b(1, "\u044F"))) { return false; } } while (false); // delete, line 143 slice_del(); break; case 2: // (, line 151 // delete, line 151 slice_del(); break; } return true; } private boolean r_noun() { int among_var; // (, line 159 // [, line 160 ket = cursor; // substring, line 160 among_var = find_among_b(a_5, 36); if (among_var == 0) { return false; } // ], line 160 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 167 // delete, line 167 slice_del(); break; } return true; } private boolean r_derivational() { int among_var; // (, line 175 // [, line 176 ket = cursor; // substring, line 176 among_var = find_among_b(a_6, 2); if (among_var == 0) { return false; } // ], line 176 bra = cursor; // call R2, line 176 if (!r_R2()) { return false; } switch(among_var) { case 0: return false; case 1: // (, line 179 // delete, line 179 slice_del(); break; } return true; } private boolean r_tidy_up() { int among_var; // (, line 183 // [, line 184 ket = cursor; // substring, line 184 among_var = find_among_b(a_7, 4); if (among_var == 0) { return false; } // ], line 184 bra = cursor; switch(among_var) { case 0: return false; case 1: // (, line 188 // delete, line 188 slice_del(); // [, line 189 ket = cursor; // literal, line 189 if (!(eq_s_b(1, "\u043D"))) { return false; } // ], line 189 bra = cursor; // literal, line 189 if (!(eq_s_b(1, "\u043D"))) { return false; } // delete, line 189 slice_del(); break; case 2: // (, line 192 // literal, line 192 if (!(eq_s_b(1, "\u043D"))) { return false; } // delete, line 192 slice_del(); break; case 3: // (, line 194 // delete, line 194 slice_del(); break; } return true; } public boolean stem() { int v_1; int v_2; int v_3; int v_4; int v_5; int v_6; int v_7; int v_8; int v_9; int v_10; // (, line 199 // do, line 201 v_1 = cursor; lab0: do { // call mark_regions, line 201 if (!r_mark_regions()) { break lab0; } } while (false); cursor = v_1; // backwards, line 202 limit_backward = cursor; cursor = limit; // setlimit, line 202 v_2 = limit - cursor; // tomark, line 202 if (cursor < I_pV) { return false; } cursor = I_pV; v_3 = limit_backward; limit_backward = cursor; cursor = limit - v_2; // (, line 202 // do, line 203 v_4 = limit - cursor; lab1: do { // (, line 203 // or, line 204 lab2: do { v_5 = limit - cursor; lab3: do { // call perfective_gerund, line 204 if (!r_perfective_gerund()) { break lab3; } break lab2; } while (false); cursor = limit - v_5; // (, line 205 // try, line 205 v_6 = limit - cursor; lab4: do { // call reflexive, line 205 if (!r_reflexive()) { cursor = limit - v_6; break lab4; } } while (false); // or, line 206 lab5: do { v_7 = limit - cursor; lab6: do { // call adjectival, line 206 if (!r_adjectival()) { break lab6; } break lab5; } while (false); cursor = limit - v_7; lab7: do { // call verb, line 206 if (!r_verb()) { break lab7; } break lab5; } while (false); cursor = limit - v_7; // call noun, line 206 if (!r_noun()) { break lab1; } } while (false); } while (false); } while (false); cursor = limit - v_4; // try, line 209 v_8 = limit - cursor; lab8: do { // (, line 209 // [, line 209 ket = cursor; // literal, line 209 if (!(eq_s_b(1, "\u0438"))) { cursor = limit - v_8; break lab8; } // ], line 209 bra = cursor; // delete, line 209 slice_del(); } while (false); // do, line 212 v_9 = limit - cursor; lab9: do { // call derivational, line 212 if (!r_derivational()) { break lab9; } } while (false); cursor = limit - v_9; // do, line 213 v_10 = limit - cursor; lab10: do { // call tidy_up, line 213 if (!r_tidy_up()) { break lab10; } } while (false); cursor = limit - v_10; limit_backward = v_3; cursor = limit_backward; return true; } public boolean equals( Object o ) { return o instanceof russianStemmer; } public int hashCode() { return russianStemmer.class.getName().hashCode(); } }