All Downloads are FREE. Search and download functionality uses the official Maven repository.

org.tartarus.snowball.ext.russianStemmer Maven / Gradle / Ivy

Go to download

The S-Space Package is a collection of algorithms for building Semantic Spaces as well as a highly scalable library for designing new distributional semantics algorithms. Distributional algorithms process text corpora and represent the semantics of words as high-dimensional feature vectors. This package also includes matrices, vectors, and numerous clustering algorithms. These approaches are known by many names, such as word spaces, semantic spaces, or distributed semantics, and rest upon the Distributional Hypothesis: words that appear in similar contexts have similar meanings.

The newest version!
// This file was generated automatically by the Snowball to Java compiler

package org.tartarus.snowball.ext;

import org.tartarus.snowball.Among;

 /**
  * This class was automatically generated by the Snowball to Java compiler.
  * It implements the stemming algorithm defined by a Snowball script.
  */

public class russianStemmer extends org.tartarus.snowball.SnowballStemmer {

// Serialization version id.
// NOTE(review): only meaningful if a supertype is Serializable -- not visible from this file.
private static final long serialVersionUID = 1L;

        // Single shared instance that is passed as the last constructor argument of every
        // Among entry in the suffix tables of this class.
        private final static russianStemmer methodObject = new russianStemmer ();

                // Suffix table searched by r_perfective_gerund() through find_among_b(a_0, 9).
                // Entries are built as (suffix, int, int, "", methodObject). In this table the
                // first int is -1 or the index of a shorter entry that the suffix ends with, and
                // the second int is 1 or 2, the values r_perfective_gerund() switches on.
                // NOTE(review): the Among constructor is not visible here; the meaning of the two
                // ints is inferred from this usage -- confirm against Among.
                private final static Among a_0[] = {
                    new Among ( "\u0432", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0432", 0, 2, "", methodObject ),
                    new Among ( "\u044B\u0432", 0, 2, "", methodObject ),
                    new Among ( "\u0432\u0448\u0438", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0432\u0448\u0438", 3, 2, "", methodObject ),
                    new Among ( "\u044B\u0432\u0448\u0438", 3, 2, "", methodObject ),
                    new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject ),
                    new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject )
                };

                // Suffix table searched by r_adjective() through find_among_b(a_1, 26).
                // All 26 entries carry -1 and 1 as their int arguments; r_adjective() deletes the
                // matched slice when the search yields 1.
                // NOTE(review): the meaning of the int arguments is defined by Among, which is not
                // visible here.
                private final static Among a_1[] = {
                    new Among ( "\u0435\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u044B\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043C\u0438", -1, 1, "", methodObject ),
                    new Among ( "\u044B\u043C\u0438", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u044B\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u044B\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0433\u043E", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u0433\u043E", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043C\u0443", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u043C\u0443", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0445", -1, 1, "", methodObject ),
                    new Among ( "\u044B\u0445", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u044E", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u044E", -1, 1, "", methodObject ),
                    new Among ( "\u0443\u044E", -1, 1, "", methodObject ),
                    new Among ( "\u044E\u044E", -1, 1, "", methodObject ),
                    new Among ( "\u0430\u044F", -1, 1, "", methodObject ),
                    new Among ( "\u044F\u044F", -1, 1, "", methodObject )
                };

                // Suffix table searched by r_adjectival() through find_among_b(a_2, 8), after
                // r_adjective() has succeeded. The last int of each entry is 1 or 2, the values
                // r_adjectival() switches on; the first int is -1 or the index of a shorter entry
                // that the suffix ends with.
                // NOTE(review): the meaning of the int arguments is defined by Among, which is not
                // visible here.
                private final static Among a_2[] = {
                    new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u043D\u043D", -1, 1, "", methodObject ),
                    new Among ( "\u0432\u0448", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0432\u0448", 2, 2, "", methodObject ),
                    new Among ( "\u044B\u0432\u0448", 2, 2, "", methodObject ),
                    new Among ( "\u0449", -1, 1, "", methodObject ),
                    new Among ( "\u044E\u0449", 5, 1, "", methodObject ),
                    new Among ( "\u0443\u044E\u0449", 6, 2, "", methodObject )
                };

                // Two-entry suffix table searched by r_reflexive() through find_among_b(a_3, 2);
                // r_reflexive() deletes the matched slice when the search yields 1.
                private final static Among a_3[] = {
                    new Among ( "\u0441\u044C", -1, 1, "", methodObject ),
                    new Among ( "\u0441\u044F", -1, 1, "", methodObject )
                };

                // Suffix table searched by r_verb() through find_among_b(a_4, 46).
                // The last int of each entry is 1 or 2, the values r_verb() switches on: for 1 the
                // suffix is deleted only when a one-character literal check ("\u0430" or "\u044F")
                // succeeds first, for 2 it is deleted unconditionally. The first int is -1 or the
                // index of a shorter entry that the suffix ends with.
                // NOTE(review): the meaning of the int arguments is defined by Among, which is not
                // visible here. Entry order matters to the indices, so do not reorder.
                private final static Among a_4[] = {
                    new Among ( "\u043B\u0430", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043B\u0430", 0, 2, "", methodObject ),
                    new Among ( "\u044B\u043B\u0430", 0, 2, "", methodObject ),
                    new Among ( "\u043D\u0430", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043D\u0430", 3, 2, "", methodObject ),
                    new Among ( "\u0435\u0442\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0442\u0435", -1, 2, "", methodObject ),
                    new Among ( "\u0439\u0442\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0439\u0442\u0435", 7, 2, "", methodObject ),
                    new Among ( "\u0443\u0439\u0442\u0435", 7, 2, "", methodObject ),
                    new Among ( "\u043B\u0438", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043B\u0438", 10, 2, "", methodObject ),
                    new Among ( "\u044B\u043B\u0438", 10, 2, "", methodObject ),
                    new Among ( "\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0439", 13, 2, "", methodObject ),
                    new Among ( "\u0443\u0439", 13, 2, "", methodObject ),
                    new Among ( "\u043B", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043B", 16, 2, "", methodObject ),
                    new Among ( "\u044B\u043B", 16, 2, "", methodObject ),
                    new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043C", -1, 2, "", methodObject ),
                    new Among ( "\u044B\u043C", -1, 2, "", methodObject ),
                    new Among ( "\u043D", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043D", 22, 2, "", methodObject ),
                    new Among ( "\u043B\u043E", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u043B\u043E", 24, 2, "", methodObject ),
                    new Among ( "\u044B\u043B\u043E", 24, 2, "", methodObject ),
                    new Among ( "\u043D\u043E", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043D\u043E", 27, 2, "", methodObject ),
                    new Among ( "\u043D\u043D\u043E", 27, 1, "", methodObject ),
                    new Among ( "\u0435\u0442", -1, 1, "", methodObject ),
                    new Among ( "\u0443\u0435\u0442", 30, 2, "", methodObject ),
                    new Among ( "\u0438\u0442", -1, 2, "", methodObject ),
                    new Among ( "\u044B\u0442", -1, 2, "", methodObject ),
                    new Among ( "\u044E\u0442", -1, 1, "", methodObject ),
                    new Among ( "\u0443\u044E\u0442", 34, 2, "", methodObject ),
                    new Among ( "\u044F\u0442", -1, 2, "", methodObject ),
                    new Among ( "\u043D\u044B", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043D\u044B", 37, 2, "", methodObject ),
                    new Among ( "\u0442\u044C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0442\u044C", 39, 2, "", methodObject ),
                    new Among ( "\u044B\u0442\u044C", 39, 2, "", methodObject ),
                    new Among ( "\u0435\u0448\u044C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0448\u044C", -1, 2, "", methodObject ),
                    new Among ( "\u044E", -1, 2, "", methodObject ),
                    new Among ( "\u0443\u044E", 44, 2, "", methodObject )
                };

                // Suffix table searched by r_noun() through find_among_b(a_5, 36).
                // Every entry carries 1 as its last int; r_noun() deletes the matched slice when
                // the search yields 1. The first int is -1 or the index of a shorter entry that
                // the suffix ends with.
                // NOTE(review): the meaning of the int arguments is defined by Among, which is not
                // visible here. Entry order matters to the indices, so do not reorder.
                private final static Among a_5[] = {
                    new Among ( "\u0430", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0432", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u0432", -1, 1, "", methodObject ),
                    new Among ( "\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0435", 3, 1, "", methodObject ),
                    new Among ( "\u044C\u0435", 3, 1, "", methodObject ),
                    new Among ( "\u0438", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0438", 6, 1, "", methodObject ),
                    new Among ( "\u0438\u0438", 6, 1, "", methodObject ),
                    new Among ( "\u0430\u043C\u0438", 6, 1, "", methodObject ),
                    new Among ( "\u044F\u043C\u0438", 6, 1, "", methodObject ),
                    new Among ( "\u0438\u044F\u043C\u0438", 10, 1, "", methodObject ),
                    new Among ( "\u0439", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u0439", 12, 1, "", methodObject ),
                    new Among ( "\u0438\u0435\u0439", 13, 1, "", methodObject ),
                    new Among ( "\u0438\u0439", 12, 1, "", methodObject ),
                    new Among ( "\u043E\u0439", 12, 1, "", methodObject ),
                    new Among ( "\u0430\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u0435\u043C", 18, 1, "", methodObject ),
                    new Among ( "\u043E\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u044F\u043C", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u044F\u043C", 21, 1, "", methodObject ),
                    new Among ( "\u043E", -1, 1, "", methodObject ),
                    new Among ( "\u0443", -1, 1, "", methodObject ),
                    new Among ( "\u0430\u0445", -1, 1, "", methodObject ),
                    new Among ( "\u044F\u0445", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u044F\u0445", 26, 1, "", methodObject ),
                    new Among ( "\u044B", -1, 1, "", methodObject ),
                    new Among ( "\u044C", -1, 1, "", methodObject ),
                    new Among ( "\u044E", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u044E", 30, 1, "", methodObject ),
                    new Among ( "\u044C\u044E", 30, 1, "", methodObject ),
                    new Among ( "\u044F", -1, 1, "", methodObject ),
                    new Among ( "\u0438\u044F", 33, 1, "", methodObject ),
                    new Among ( "\u044C\u044F", 33, 1, "", methodObject )
                };

                // Two-entry suffix table searched by r_derivational() through find_among_b(a_6, 2);
                // the matched slice is deleted only if r_R2() also succeeds.
                private final static Among a_6[] = {
                    new Among ( "\u043E\u0441\u0442", -1, 1, "", methodObject ),
                    new Among ( "\u043E\u0441\u0442\u044C", -1, 1, "", methodObject )
                };

                // Suffix table searched by r_tidy_up() through find_among_b(a_7, 4).
                // The last int of each entry (1, 2 or 3) selects the branch r_tidy_up() takes
                // after a match.
                // NOTE(review): the meaning of the int arguments is defined by Among, which is not
                // visible here.
                private final static Among a_7[] = {
                    new Among ( "\u0435\u0439\u0448\u0435", -1, 1, "", methodObject ),
                    new Among ( "\u043D", -1, 2, "", methodObject ),
                    new Among ( "\u0435\u0439\u0448", -1, 1, "", methodObject ),
                    new Among ( "\u044C", -1, 3, "", methodObject )
                };

                // Character-group data handed to in_grouping()/out_grouping() in r_mark_regions()
                // together with the bounds 1072 and 1103 (U+0430..U+044F).
                // NOTE(review): presumably a bitmap of the vowels relative to 1072 -- confirm
                // against the in_grouping implementation in the superclass.
                private static final char g_v[] = {33, 65, 8, 232 };

        // Region marker set by r_mark_regions(); r_R2() succeeds only when I_p2 <= cursor.
        private int I_p2;
        // Region marker set by r_mark_regions(); stem() installs it as limit_backward while
        // it strips endings.
        private int I_pV;

                /**
                 * Copies the two region markers from {@code other} into this stemmer and then
                 * hands {@code other} to the superclass {@code copy_from} for the remaining state.
                 *
                 * @param other stemmer whose {@code I_p2} and {@code I_pV} values are taken over
                 */
                private void copy_from(russianStemmer other) {
                    this.I_p2 = other.I_p2;
                    this.I_pV = other.I_pV;
                    super.copy_from(other);
                }

                /**
                 * Computes the region markers {@code I_pV} and {@code I_p2}.
                 *
                 * Both markers start out as {@code limit}. The cursor is then advanced until
                 * {@code in_grouping(g_v, 1072, 1103)} succeeds, and that position is stored in
                 * {@code I_pV}. After a further out/in/out sequence of successful grouping
                 * checks the position is stored in {@code I_p2}. If the cursor reaches
                 * {@code limit} before a check succeeds, the scan stops and the markers not yet
                 * set keep the value {@code limit}. The cursor is restored before returning.
                 *
                 * NOTE(review): the grouping checks are assumed to advance the cursor themselves
                 * on success (superclass behaviour, not visible here).
                 *
                 * @return always {@code true}
                 */
                private boolean r_mark_regions() {
                    // Defaults used when the word is too short for a marker to be found
                    I_pV = limit;
                    I_p2 = limit;

                    final int startCursor = cursor;
                    scan: {
                        // Step forward until an in-group character has been consumed
                        while (!in_grouping(g_v, 1072, 1103)) {
                            if (cursor >= limit) {
                                break scan;
                            }
                            cursor++;
                        }
                        I_pV = cursor;

                        // Then past an out-of-group character ...
                        while (!out_grouping(g_v, 1072, 1103)) {
                            if (cursor >= limit) {
                                break scan;
                            }
                            cursor++;
                        }
                        // ... past the next in-group character ...
                        while (!in_grouping(g_v, 1072, 1103)) {
                            if (cursor >= limit) {
                                break scan;
                            }
                            cursor++;
                        }
                        // ... and past one more out-of-group character
                        while (!out_grouping(g_v, 1072, 1103)) {
                            if (cursor >= limit) {
                                break scan;
                            }
                            cursor++;
                        }
                        I_p2 = cursor;
                    }
                    cursor = startCursor;
                    return true;
                }

                /**
                 * Tests whether the cursor is at or beyond the {@code I_p2} marker.
                 *
                 * @return {@code true} when {@code I_p2 <= cursor}, {@code false} otherwise
                 */
                private boolean r_R2() {
                    return I_p2 <= cursor;
                }

                /**
                 * Tries to delete an ending listed in {@code a_0}.
                 *
                 * {@code ket} is set to the cursor, {@code a_0} is searched with
                 * {@code find_among_b}, and {@code bra} is set to the cursor afterwards. For
                 * result 1 the slice is deleted only if {@code eq_s_b} accepts "\u0430" or,
                 * failing that, "\u044F" at the cursor; for result 2 it is deleted
                 * unconditionally.
                 *
                 * @return {@code false} if the search yields 0 or the literal check for result 1
                 *         fails; {@code true} otherwise
                 */
                private boolean r_perfective_gerund() {
                    ket = cursor;
                    final int ending = find_among_b(a_0, 9);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;

                    if (ending == 1) {
                        // Either literal may precede the ending; rewind between the two attempts
                        final int beforeLiteral = limit - cursor;
                        if (!eq_s_b(1, "\u0430")) {
                            cursor = limit - beforeLiteral;
                            if (!eq_s_b(1, "\u044F")) {
                                return false;
                            }
                        }
                        slice_del();
                    } else if (ending == 2) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Tries to delete an ending listed in {@code a_1}.
                 *
                 * {@code ket} and {@code bra} are set to the cursor before and after the
                 * {@code find_among_b} search; the slice is deleted when the search yields 1.
                 *
                 * @return {@code false} if the search yields 0, {@code true} otherwise
                 */
                private boolean r_adjective() {
                    ket = cursor;
                    final int ending = find_among_b(a_1, 26);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;
                    if (ending == 1) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Runs {@code r_adjective()} and, if it succeeds, optionally deletes one further
                 * ending listed in {@code a_2}.
                 *
                 * The second step is a "try": when the {@code a_2} search yields 0, or when
                 * result 1 is not accompanied by a successful {@code eq_s_b} check for "\u0430"
                 * or "\u044F", the cursor is reset to where it was after {@code r_adjective()}
                 * and the method still succeeds.
                 *
                 * @return {@code false} only if {@code r_adjective()} fails; {@code true} otherwise
                 */
                private boolean r_adjectival() {
                    if (!r_adjective()) {
                        return false;
                    }

                    final int afterAdjective = limit - cursor;
                    ket = cursor;
                    final int ending = find_among_b(a_2, 8);
                    if (ending == 0) {
                        cursor = limit - afterAdjective;
                        return true;
                    }
                    bra = cursor;

                    if (ending == 1) {
                        // Either literal may precede the ending; rewind between the two attempts
                        final int beforeLiteral = limit - cursor;
                        if (!eq_s_b(1, "\u0430")) {
                            cursor = limit - beforeLiteral;
                            if (!eq_s_b(1, "\u044F")) {
                                // Give up on the optional step but keep the overall success
                                cursor = limit - afterAdjective;
                                return true;
                            }
                        }
                        slice_del();
                    } else if (ending == 2) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Tries to delete an ending listed in {@code a_3}.
                 *
                 * {@code ket} and {@code bra} are set to the cursor before and after the
                 * {@code find_among_b} search; the slice is deleted when the search yields 1.
                 *
                 * @return {@code false} if the search yields 0, {@code true} otherwise
                 */
                private boolean r_reflexive() {
                    ket = cursor;
                    final int ending = find_among_b(a_3, 2);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;
                    if (ending == 1) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Tries to delete an ending listed in {@code a_4}.
                 *
                 * {@code ket} and {@code bra} are set to the cursor before and after the
                 * {@code find_among_b} search. For result 1 the slice is deleted only if
                 * {@code eq_s_b} accepts "\u0430" or, failing that, "\u044F" at the cursor; for
                 * result 2 it is deleted unconditionally.
                 *
                 * @return {@code false} if the search yields 0 or the literal check for result 1
                 *         fails; {@code true} otherwise
                 */
                private boolean r_verb() {
                    ket = cursor;
                    final int ending = find_among_b(a_4, 46);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;

                    if (ending == 1) {
                        // Either literal may precede the ending; rewind between the two attempts
                        final int beforeLiteral = limit - cursor;
                        if (!eq_s_b(1, "\u0430")) {
                            cursor = limit - beforeLiteral;
                            if (!eq_s_b(1, "\u044F")) {
                                return false;
                            }
                        }
                        slice_del();
                    } else if (ending == 2) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Tries to delete an ending listed in {@code a_5}.
                 *
                 * {@code ket} and {@code bra} are set to the cursor before and after the
                 * {@code find_among_b} search; the slice is deleted when the search yields 1.
                 *
                 * @return {@code false} if the search yields 0, {@code true} otherwise
                 */
                private boolean r_noun() {
                    ket = cursor;
                    final int ending = find_among_b(a_5, 36);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;
                    if (ending == 1) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Tries to delete an ending listed in {@code a_6}, provided {@code r_R2()}
                 * succeeds at the position reached by the search.
                 *
                 * {@code ket} and {@code bra} are set to the cursor before and after the
                 * {@code find_among_b} search; the slice is deleted when the search yields 1.
                 *
                 * @return {@code false} if the search yields 0 or {@code r_R2()} fails;
                 *         {@code true} otherwise
                 */
                private boolean r_derivational() {
                    ket = cursor;
                    final int ending = find_among_b(a_6, 2);
                    if (ending == 0) {
                        return false;
                    }
                    bra = cursor;

                    final boolean insideR2 = r_R2();
                    if (!insideR2) {
                        return false;
                    }
                    if (ending == 1) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Final clean-up step driven by the {@code a_7} table.
                 *
                 * After the {@code find_among_b} search the result selects one of three actions:
                 * <ul>
                 *   <li>1: delete the matched slice, then require two consecutive
                 *       {@code eq_s_b(1, "\u043D")} matches; the first one is bracketed by
                 *       {@code ket}/{@code bra} and deleted.</li>
                 *   <li>2: require one {@code eq_s_b(1, "\u043D")} match, then delete the slice.</li>
                 *   <li>3: delete the slice.</li>
                 * </ul>
                 *
                 * @return {@code false} if the search yields 0 or a required literal check fails;
                 *         {@code true} otherwise
                 */
                private boolean r_tidy_up() {
                    ket = cursor;
                    final int action = find_among_b(a_7, 4);
                    if (action == 0) {
                        return false;
                    }
                    bra = cursor;

                    if (action == 1) {
                        slice_del();
                        // Re-bracket a single "\u043D" that must itself be preceded by another one
                        ket = cursor;
                        if (!eq_s_b(1, "\u043D")) {
                            return false;
                        }
                        bra = cursor;
                        if (!eq_s_b(1, "\u043D")) {
                            return false;
                        }
                        slice_del();
                    } else if (action == 2) {
                        if (!eq_s_b(1, "\u043D")) {
                            return false;
                        }
                        slice_del();
                    } else if (action == 3) {
                        slice_del();
                    }
                    return true;
                }

                /**
                 * Stems the current word in place.
                 *
                 * Steps, in order:
                 * <ol>
                 *   <li>{@code r_mark_regions()} sets {@code I_pV} and {@code I_p2}; the cursor
                 *       is restored afterwards.</li>
                 *   <li>Processing switches to backward mode with {@code limit_backward} set to
                 *       {@code I_pV}.</li>
                 *   <li>Main ending: {@code r_perfective_gerund()}; if that fails, an optional
                 *       {@code r_reflexive()} followed by the first success among
                 *       {@code r_adjectival()}, {@code r_verb()} and {@code r_noun()}.</li>
                 *   <li>An optional trailing "\u0438" is deleted.</li>
                 *   <li>{@code r_derivational()} and {@code r_tidy_up()} each run once, with the
                 *       cursor reset after each.</li>
                 *   <li>{@code limit_backward} is restored and the cursor is placed on it.</li>
                 * </ol>
                 *
                 * Saved positions are kept as offsets from {@code limit} and re-applied as
                 * {@code limit - offset}, exactly where the generated code did so.
                 * NOTE(review): presumably because deletions move {@code limit} -- confirm in
                 * the superclass.
                 *
                 * @return {@code false} only if {@code limit} lies before {@code I_pV} when the
                 *         backward limit is installed; {@code true} otherwise
                 */
                public boolean stem() {
                    // Region marking; its result is always true and the cursor is put back
                    final int entryCursor = cursor;
                    r_mark_regions();
                    cursor = entryCursor;

                    // Switch to backward processing, bounded below by I_pV
                    limit_backward = cursor;
                    cursor = limit;
                    final int endOffset = limit - cursor;
                    if (cursor < I_pV) {
                        return false;
                    }
                    cursor = I_pV;
                    final int outerLimitBackward = limit_backward;
                    limit_backward = cursor;
                    cursor = limit - endOffset;

                    // Main ending removal
                    final int beforeMainEnding = limit - cursor;
                    mainEnding: {
                        final int beforeGerund = limit - cursor;
                        if (r_perfective_gerund()) {
                            break mainEnding;
                        }
                        cursor = limit - beforeGerund;

                        // Optional reflexive ending
                        final int beforeReflexive = limit - cursor;
                        if (!r_reflexive()) {
                            cursor = limit - beforeReflexive;
                        }

                        // First success among adjectival, verb and noun endings
                        final int beforeWordClass = limit - cursor;
                        if (r_adjectival()) {
                            break mainEnding;
                        }
                        cursor = limit - beforeWordClass;
                        if (r_verb()) {
                            break mainEnding;
                        }
                        cursor = limit - beforeWordClass;
                        // Success or failure of the last alternative leads to the same place
                        r_noun();
                    }
                    cursor = limit - beforeMainEnding;

                    // Optional trailing "\u0438"
                    final int beforeTrailingI = limit - cursor;
                    ket = cursor;
                    if (eq_s_b(1, "\u0438")) {
                        bra = cursor;
                        slice_del();
                    } else {
                        cursor = limit - beforeTrailingI;
                    }

                    // Derivational ending
                    final int beforeDerivational = limit - cursor;
                    r_derivational();
                    cursor = limit - beforeDerivational;

                    // Final tidy-up
                    final int beforeTidyUp = limit - cursor;
                    r_tidy_up();
                    cursor = limit - beforeTidyUp;

                    // Leave backward mode
                    limit_backward = outerLimitBackward;
                    cursor = limit_backward;
                    return true;
                }

        /**
         * Treats every {@code russianStemmer} as equal to every other one, regardless of
         * the word currently being processed.
         *
         * @param o object to compare with; may be {@code null}
         * @return {@code true} if {@code o} is a {@code russianStemmer}, {@code false}
         *         otherwise (including for {@code null})
         */
        @Override
        public boolean equals( Object o ) {
            return o instanceof russianStemmer;
        }

        /**
         * Returns a hash derived solely from the class name, so that all instances share
         * one hash code, consistent with {@code equals} treating all instances as equal.
         *
         * @return hash code of the fully qualified class name
         */
        @Override
        public int hashCode() {
            return russianStemmer.class.getName().hashCode();
        }



}





© 2015 - 2024 Weber Informatics LLC | Privacy Policy