All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.tartarus.snowball.ext.russianStemmer Maven / Gradle / Ivy

The newest version!
// This file was generated automatically by the Snowball to Java compiler
// http://snowballstem.org/

package org.tartarus.snowball.ext;

import org.tartarus.snowball.Among;

 /**
  * This class was automatically generated by a Snowball to Java compiler
  * It implements the stemming algorithm defined by a snowball script.
  */

public class russianStemmer extends org.tartarus.snowball.SnowballStemmer {

    private static final long serialVersionUID = 1L;

    private final static Among a_0[] = {
        new Among ( "\u0432", -1, 1 ),
        new Among ( "\u0438\u0432", 0, 2 ),
        new Among ( "\u044B\u0432", 0, 2 ),
        new Among ( "\u0432\u0448\u0438", -1, 1 ),
        new Among ( "\u0438\u0432\u0448\u0438", 3, 2 ),
        new Among ( "\u044B\u0432\u0448\u0438", 3, 2 ),
        new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1 ),
        new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2 ),
        new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2 )
    };

    private final static Among a_1[] = {
        new Among ( "\u0435\u0435", -1, 1 ),
        new Among ( "\u0438\u0435", -1, 1 ),
        new Among ( "\u043E\u0435", -1, 1 ),
        new Among ( "\u044B\u0435", -1, 1 ),
        new Among ( "\u0438\u043C\u0438", -1, 1 ),
        new Among ( "\u044B\u043C\u0438", -1, 1 ),
        new Among ( "\u0435\u0439", -1, 1 ),
        new Among ( "\u0438\u0439", -1, 1 ),
        new Among ( "\u043E\u0439", -1, 1 ),
        new Among ( "\u044B\u0439", -1, 1 ),
        new Among ( "\u0435\u043C", -1, 1 ),
        new Among ( "\u0438\u043C", -1, 1 ),
        new Among ( "\u043E\u043C", -1, 1 ),
        new Among ( "\u044B\u043C", -1, 1 ),
        new Among ( "\u0435\u0433\u043E", -1, 1 ),
        new Among ( "\u043E\u0433\u043E", -1, 1 ),
        new Among ( "\u0435\u043C\u0443", -1, 1 ),
        new Among ( "\u043E\u043C\u0443", -1, 1 ),
        new Among ( "\u0438\u0445", -1, 1 ),
        new Among ( "\u044B\u0445", -1, 1 ),
        new Among ( "\u0435\u044E", -1, 1 ),
        new Among ( "\u043E\u044E", -1, 1 ),
        new Among ( "\u0443\u044E", -1, 1 ),
        new Among ( "\u044E\u044E", -1, 1 ),
        new Among ( "\u0430\u044F", -1, 1 ),
        new Among ( "\u044F\u044F", -1, 1 )
    };

    private final static Among a_2[] = {
        new Among ( "\u0435\u043C", -1, 1 ),
        new Among ( "\u043D\u043D", -1, 1 ),
        new Among ( "\u0432\u0448", -1, 1 ),
        new Among ( "\u0438\u0432\u0448", 2, 2 ),
        new Among ( "\u044B\u0432\u0448", 2, 2 ),
        new Among ( "\u0449", -1, 1 ),
        new Among ( "\u044E\u0449", 5, 1 ),
        new Among ( "\u0443\u044E\u0449", 6, 2 )
    };

    private final static Among a_3[] = {
        new Among ( "\u0441\u044C", -1, 1 ),
        new Among ( "\u0441\u044F", -1, 1 )
    };

    private final static Among a_4[] = {
        new Among ( "\u043B\u0430", -1, 1 ),
        new Among ( "\u0438\u043B\u0430", 0, 2 ),
        new Among ( "\u044B\u043B\u0430", 0, 2 ),
        new Among ( "\u043D\u0430", -1, 1 ),
        new Among ( "\u0435\u043D\u0430", 3, 2 ),
        new Among ( "\u0435\u0442\u0435", -1, 1 ),
        new Among ( "\u0438\u0442\u0435", -1, 2 ),
        new Among ( "\u0439\u0442\u0435", -1, 1 ),
        new Among ( "\u0435\u0439\u0442\u0435", 7, 2 ),
        new Among ( "\u0443\u0439\u0442\u0435", 7, 2 ),
        new Among ( "\u043B\u0438", -1, 1 ),
        new Among ( "\u0438\u043B\u0438", 10, 2 ),
        new Among ( "\u044B\u043B\u0438", 10, 2 ),
        new Among ( "\u0439", -1, 1 ),
        new Among ( "\u0435\u0439", 13, 2 ),
        new Among ( "\u0443\u0439", 13, 2 ),
        new Among ( "\u043B", -1, 1 ),
        new Among ( "\u0438\u043B", 16, 2 ),
        new Among ( "\u044B\u043B", 16, 2 ),
        new Among ( "\u0435\u043C", -1, 1 ),
        new Among ( "\u0438\u043C", -1, 2 ),
        new Among ( "\u044B\u043C", -1, 2 ),
        new Among ( "\u043D", -1, 1 ),
        new Among ( "\u0435\u043D", 22, 2 ),
        new Among ( "\u043B\u043E", -1, 1 ),
        new Among ( "\u0438\u043B\u043E", 24, 2 ),
        new Among ( "\u044B\u043B\u043E", 24, 2 ),
        new Among ( "\u043D\u043E", -1, 1 ),
        new Among ( "\u0435\u043D\u043E", 27, 2 ),
        new Among ( "\u043D\u043D\u043E", 27, 1 ),
        new Among ( "\u0435\u0442", -1, 1 ),
        new Among ( "\u0443\u0435\u0442", 30, 2 ),
        new Among ( "\u0438\u0442", -1, 2 ),
        new Among ( "\u044B\u0442", -1, 2 ),
        new Among ( "\u044E\u0442", -1, 1 ),
        new Among ( "\u0443\u044E\u0442", 34, 2 ),
        new Among ( "\u044F\u0442", -1, 2 ),
        new Among ( "\u043D\u044B", -1, 1 ),
        new Among ( "\u0435\u043D\u044B", 37, 2 ),
        new Among ( "\u0442\u044C", -1, 1 ),
        new Among ( "\u0438\u0442\u044C", 39, 2 ),
        new Among ( "\u044B\u0442\u044C", 39, 2 ),
        new Among ( "\u0435\u0448\u044C", -1, 1 ),
        new Among ( "\u0438\u0448\u044C", -1, 2 ),
        new Among ( "\u044E", -1, 2 ),
        new Among ( "\u0443\u044E", 44, 2 )
    };

    private final static Among a_5[] = {
        new Among ( "\u0430", -1, 1 ),
        new Among ( "\u0435\u0432", -1, 1 ),
        new Among ( "\u043E\u0432", -1, 1 ),
        new Among ( "\u0435", -1, 1 ),
        new Among ( "\u0438\u0435", 3, 1 ),
        new Among ( "\u044C\u0435", 3, 1 ),
        new Among ( "\u0438", -1, 1 ),
        new Among ( "\u0435\u0438", 6, 1 ),
        new Among ( "\u0438\u0438", 6, 1 ),
        new Among ( "\u0430\u043C\u0438", 6, 1 ),
        new Among ( "\u044F\u043C\u0438", 6, 1 ),
        new Among ( "\u0438\u044F\u043C\u0438", 10, 1 ),
        new Among ( "\u0439", -1, 1 ),
        new Among ( "\u0435\u0439", 12, 1 ),
        new Among ( "\u0438\u0435\u0439", 13, 1 ),
        new Among ( "\u0438\u0439", 12, 1 ),
        new Among ( "\u043E\u0439", 12, 1 ),
        new Among ( "\u0430\u043C", -1, 1 ),
        new Among ( "\u0435\u043C", -1, 1 ),
        new Among ( "\u0438\u0435\u043C", 18, 1 ),
        new Among ( "\u043E\u043C", -1, 1 ),
        new Among ( "\u044F\u043C", -1, 1 ),
        new Among ( "\u0438\u044F\u043C", 21, 1 ),
        new Among ( "\u043E", -1, 1 ),
        new Among ( "\u0443", -1, 1 ),
        new Among ( "\u0430\u0445", -1, 1 ),
        new Among ( "\u044F\u0445", -1, 1 ),
        new Among ( "\u0438\u044F\u0445", 26, 1 ),
        new Among ( "\u044B", -1, 1 ),
        new Among ( "\u044C", -1, 1 ),
        new Among ( "\u044E", -1, 1 ),
        new Among ( "\u0438\u044E", 30, 1 ),
        new Among ( "\u044C\u044E", 30, 1 ),
        new Among ( "\u044F", -1, 1 ),
        new Among ( "\u0438\u044F", 33, 1 ),
        new Among ( "\u044C\u044F", 33, 1 )
    };

    private final static Among a_6[] = {
        new Among ( "\u043E\u0441\u0442", -1, 1 ),
        new Among ( "\u043E\u0441\u0442\u044C", -1, 1 )
    };

    private final static Among a_7[] = {
        new Among ( "\u0435\u0439\u0448\u0435", -1, 1 ),
        new Among ( "\u043D", -1, 2 ),
        new Among ( "\u0435\u0439\u0448", -1, 1 ),
        new Among ( "\u044C", -1, 3 )
    };

    private static final char g_v[] = {33, 65, 8, 232 };

    private int I_p2;
    private int I_pV;


    private boolean r_mark_regions() {
        int v_1;
        // (, line 57
        I_pV = limit;
        I_p2 = limit;
        // do, line 61
        v_1 = cursor;
        lab0: do {
            // (, line 61
            // gopast, line 62
            golab1: while(true)
            {
                lab2: do {
                    if (!(in_grouping(g_v, 1072, 1103)))
                    {
                        break lab2;
                    }
                    break golab1;
                } while (false);
                if (cursor >= limit)
                {
                    break lab0;
                }
                cursor++;
            }
            // setmark pV, line 62
            I_pV = cursor;
            // gopast, line 62
            golab3: while(true)
            {
                lab4: do {
                    if (!(out_grouping(g_v, 1072, 1103)))
                    {
                        break lab4;
                    }
                    break golab3;
                } while (false);
                if (cursor >= limit)
                {
                    break lab0;
                }
                cursor++;
            }
            // gopast, line 63
            golab5: while(true)
            {
                lab6: do {
                    if (!(in_grouping(g_v, 1072, 1103)))
                    {
                        break lab6;
                    }
                    break golab5;
                } while (false);
                if (cursor >= limit)
                {
                    break lab0;
                }
                cursor++;
            }
            // gopast, line 63
            golab7: while(true)
            {
                lab8: do {
                    if (!(out_grouping(g_v, 1072, 1103)))
                    {
                        break lab8;
                    }
                    break golab7;
                } while (false);
                if (cursor >= limit)
                {
                    break lab0;
                }
                cursor++;
            }
            // setmark p2, line 63
            I_p2 = cursor;
        } while (false);
        cursor = v_1;
        return true;
    }

    private boolean r_R2() {
        if (!(I_p2 <= cursor))
        {
            return false;
        }
        return true;
    }

    private boolean r_perfective_gerund() {
        int among_var;
        int v_1;
        // (, line 71
        // [, line 72
        ket = cursor;
        // substring, line 72
        among_var = find_among_b(a_0);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 72
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 76
                // or, line 76
                lab0: do {
                    v_1 = limit - cursor;
                    lab1: do {
                        // literal, line 76
                        if (!(eq_s_b("\u0430")))
                        {
                            break lab1;
                        }
                        break lab0;
                    } while (false);
                    cursor = limit - v_1;
                    // literal, line 76
                    if (!(eq_s_b("\u044F")))
                    {
                        return false;
                    }
                } while (false);
                // delete, line 76
                slice_del();
                break;
            case 2:
                // (, line 83
                // delete, line 83
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_adjective() {
        int among_var;
        // (, line 87
        // [, line 88
        ket = cursor;
        // substring, line 88
        among_var = find_among_b(a_1);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 88
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 97
                // delete, line 97
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_adjectival() {
        int among_var;
        int v_1;
        int v_2;
        // (, line 101
        // call adjective, line 102
        if (!r_adjective())
        {
            return false;
        }
        // try, line 109
        v_1 = limit - cursor;
        lab0: do {
            // (, line 109
            // [, line 110
            ket = cursor;
            // substring, line 110
            among_var = find_among_b(a_2);
            if (among_var == 0)
            {
                cursor = limit - v_1;
                break lab0;
            }
            // ], line 110
            bra = cursor;
            switch (among_var) {
                case 0:
                    cursor = limit - v_1;
                    break lab0;
                case 1:
                    // (, line 115
                    // or, line 115
                    lab1: do {
                        v_2 = limit - cursor;
                        lab2: do {
                            // literal, line 115
                            if (!(eq_s_b("\u0430")))
                            {
                                break lab2;
                            }
                            break lab1;
                        } while (false);
                        cursor = limit - v_2;
                        // literal, line 115
                        if (!(eq_s_b("\u044F")))
                        {
                            cursor = limit - v_1;
                            break lab0;
                        }
                    } while (false);
                    // delete, line 115
                    slice_del();
                    break;
                case 2:
                    // (, line 122
                    // delete, line 122
                    slice_del();
                    break;
            }
        } while (false);
        return true;
    }

    private boolean r_reflexive() {
        int among_var;
        // (, line 128
        // [, line 129
        ket = cursor;
        // substring, line 129
        among_var = find_among_b(a_3);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 129
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 132
                // delete, line 132
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_verb() {
        int among_var;
        int v_1;
        // (, line 136
        // [, line 137
        ket = cursor;
        // substring, line 137
        among_var = find_among_b(a_4);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 137
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 143
                // or, line 143
                lab0: do {
                    v_1 = limit - cursor;
                    lab1: do {
                        // literal, line 143
                        if (!(eq_s_b("\u0430")))
                        {
                            break lab1;
                        }
                        break lab0;
                    } while (false);
                    cursor = limit - v_1;
                    // literal, line 143
                    if (!(eq_s_b("\u044F")))
                    {
                        return false;
                    }
                } while (false);
                // delete, line 143
                slice_del();
                break;
            case 2:
                // (, line 151
                // delete, line 151
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_noun() {
        int among_var;
        // (, line 159
        // [, line 160
        ket = cursor;
        // substring, line 160
        among_var = find_among_b(a_5);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 160
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 167
                // delete, line 167
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_derivational() {
        int among_var;
        // (, line 175
        // [, line 176
        ket = cursor;
        // substring, line 176
        among_var = find_among_b(a_6);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 176
        bra = cursor;
        // call R2, line 176
        if (!r_R2())
        {
            return false;
        }
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 179
                // delete, line 179
                slice_del();
                break;
        }
        return true;
    }

    private boolean r_tidy_up() {
        int among_var;
        // (, line 183
        // [, line 184
        ket = cursor;
        // substring, line 184
        among_var = find_among_b(a_7);
        if (among_var == 0)
        {
            return false;
        }
        // ], line 184
        bra = cursor;
        switch (among_var) {
            case 0:
                return false;
            case 1:
                // (, line 188
                // delete, line 188
                slice_del();
                // [, line 189
                ket = cursor;
                // literal, line 189
                if (!(eq_s_b("\u043D")))
                {
                    return false;
                }
                // ], line 189
                bra = cursor;
                // literal, line 189
                if (!(eq_s_b("\u043D")))
                {
                    return false;
                }
                // delete, line 189
                slice_del();
                break;
            case 2:
                // (, line 192
                // literal, line 192
                if (!(eq_s_b("\u043D")))
                {
                    return false;
                }
                // delete, line 192
                slice_del();
                break;
            case 3:
                // (, line 194
                // delete, line 194
                slice_del();
                break;
        }
        return true;
    }

    public boolean stem() {
        int v_1;
        int v_2;
        int v_3;
        int v_4;
        int v_5;
        int v_6;
        int v_7;
        int v_8;
        int v_9;
        int v_10;
        // (, line 199
        // do, line 201
        v_1 = cursor;
        lab0: do {
            // call mark_regions, line 201
            if (!r_mark_regions())
            {
                break lab0;
            }
        } while (false);
        cursor = v_1;
        // backwards, line 202
        limit_backward = cursor; cursor = limit;
        // setlimit, line 202
        v_2 = limit - cursor;
        // tomark, line 202
        if (cursor < I_pV)
        {
            return false;
        }
        cursor = I_pV;
        v_3 = limit_backward;
        limit_backward = cursor;
        cursor = limit - v_2;
        // (, line 202
        // do, line 203
        v_4 = limit - cursor;
        lab1: do {
            // (, line 203
            // or, line 204
            lab2: do {
                v_5 = limit - cursor;
                lab3: do {
                    // call perfective_gerund, line 204
                    if (!r_perfective_gerund())
                    {
                        break lab3;
                    }
                    break lab2;
                } while (false);
                cursor = limit - v_5;
                // (, line 205
                // try, line 205
                v_6 = limit - cursor;
                lab4: do {
                    // call reflexive, line 205
                    if (!r_reflexive())
                    {
                        cursor = limit - v_6;
                        break lab4;
                    }
                } while (false);
                // or, line 206
                lab5: do {
                    v_7 = limit - cursor;
                    lab6: do {
                        // call adjectival, line 206
                        if (!r_adjectival())
                        {
                            break lab6;
                        }
                        break lab5;
                    } while (false);
                    cursor = limit - v_7;
                    lab7: do {
                        // call verb, line 206
                        if (!r_verb())
                        {
                            break lab7;
                        }
                        break lab5;
                    } while (false);
                    cursor = limit - v_7;
                    // call noun, line 206
                    if (!r_noun())
                    {
                        break lab1;
                    }
                } while (false);
            } while (false);
        } while (false);
        cursor = limit - v_4;
        // try, line 209
        v_8 = limit - cursor;
        lab8: do {
            // (, line 209
            // [, line 209
            ket = cursor;
            // literal, line 209
            if (!(eq_s_b("\u0438")))
            {
                cursor = limit - v_8;
                break lab8;
            }
            // ], line 209
            bra = cursor;
            // delete, line 209
            slice_del();
        } while (false);
        // do, line 212
        v_9 = limit - cursor;
        lab9: do {
            // call derivational, line 212
            if (!r_derivational())
            {
                break lab9;
            }
        } while (false);
        cursor = limit - v_9;
        // do, line 213
        v_10 = limit - cursor;
        lab10: do {
            // call tidy_up, line 213
            if (!r_tidy_up())
            {
                break lab10;
            }
        } while (false);
        cursor = limit - v_10;
        limit_backward = v_3;
        cursor = limit_backward;        return true;
    }

    public boolean equals( Object o ) {
        return o instanceof russianStemmer;
    }

    public int hashCode() {
        return russianStemmer.class.getName().hashCode();
    }



}





© 2015 - 2025 Weber Informatics LLC | Privacy Policy