// opennlp.tools.stemmer.snowball.porterStemmer (Maven / Gradle / Ivy)
// CHECKSTYLE:OFF
/*
Copyright (c) 2001, Dr Martin Porter
Copyright (c) 2002, Richard Boulton
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
* Redistributions of source code must retain the above copyright notice,
* this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* Neither the name of the copyright holders nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE
FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
// This file was generated automatically by the Snowball to Java compiler
package opennlp.tools.stemmer.snowball;
/**
* This class was automatically generated by a Snowball to Java compiler.
* It implements the stemming algorithm defined by a Snowball script.
*/
class porterStemmer extends opennlp.tools.stemmer.snowball.AbstractSnowballStemmer {
// Shared instance handed to every Among entry below as its last constructor
// argument. It must stay declared first: static initializers run in textual
// order and the tables reference it.
private final static porterStemmer methodObject = new porterStemmer ();
// NOTE(review): Among is declared elsewhere. From the way the tables are used
// in this file, the arguments appear to be (suffix, index of a shorter entry
// in the same table that is itself a suffix of this one or -1, result code
// returned by find_among_b, method name, method object) -- confirm against Among.

// Suffix table searched by r_Step_1a. Result codes as dispatched there:
// 1 -> replace with "ss", 2 -> replace with "i", 3 -> delete,
// -1 -> no switch case matches, so the text is left unchanged.
private final static Among a_0[] = {
new Among ( "s", -1, 3, "", methodObject ),
new Among ( "ies", 0, 2, "", methodObject ),
new Among ( "sses", 0, 1, "", methodObject ),
new Among ( "ss", 0, -1, "", methodObject )
};
// Table searched by r_Step_1b after an "ed"/"ing" suffix was deleted.
// Result codes as dispatched there: 1 -> insert "e" at the cursor,
// 2 -> delete the single character before the cursor,
// 3 (the empty-string entry) -> insert "e" only when the cursor is at I_p1
// and r_shortv() succeeds.
private final static Among a_1[] = {
new Among ( "", -1, 3, "", methodObject ),
new Among ( "bb", 0, 2, "", methodObject ),
new Among ( "dd", 0, 2, "", methodObject ),
new Among ( "ff", 0, 2, "", methodObject ),
new Among ( "gg", 0, 2, "", methodObject ),
new Among ( "bl", 0, 1, "", methodObject ),
new Among ( "mm", 0, 2, "", methodObject ),
new Among ( "nn", 0, 2, "", methodObject ),
new Among ( "pp", 0, 2, "", methodObject ),
new Among ( "rr", 0, 2, "", methodObject ),
new Among ( "at", 0, 1, "", methodObject ),
new Among ( "tt", 0, 2, "", methodObject ),
new Among ( "iz", 0, 1, "", methodObject )
};
// Suffix table searched first by r_Step_1b. Result codes as dispatched there:
// 1 ("eed") -> replace with "ee" when r_R1() holds,
// 2 ("ed", "ing") -> delete, then apply the a_1 fix-ups.
private final static Among a_2[] = {
new Among ( "ed", -1, 2, "", methodObject ),
new Among ( "eed", 0, 1, "", methodObject ),
new Among ( "ing", -1, 2, "", methodObject )
};
// Suffix table searched by r_Step_2; the result code (1..14) selects the
// replacement string passed to slice_from in that method.
private final static Among a_3[] = {
new Among ( "anci", -1, 3, "", methodObject ),
new Among ( "enci", -1, 2, "", methodObject ),
new Among ( "abli", -1, 4, "", methodObject ),
new Among ( "eli", -1, 6, "", methodObject ),
new Among ( "alli", -1, 9, "", methodObject ),
new Among ( "ousli", -1, 12, "", methodObject ),
new Among ( "entli", -1, 5, "", methodObject ),
new Among ( "aliti", -1, 10, "", methodObject ),
new Among ( "biliti", -1, 14, "", methodObject ),
new Among ( "iviti", -1, 13, "", methodObject ),
new Among ( "tional", -1, 1, "", methodObject ),
new Among ( "ational", 10, 8, "", methodObject ),
new Among ( "alism", -1, 10, "", methodObject ),
new Among ( "ation", -1, 8, "", methodObject ),
new Among ( "ization", 13, 7, "", methodObject ),
new Among ( "izer", -1, 7, "", methodObject ),
new Among ( "ator", -1, 8, "", methodObject ),
new Among ( "iveness", -1, 13, "", methodObject ),
new Among ( "fulness", -1, 11, "", methodObject ),
new Among ( "ousness", -1, 12, "", methodObject )
};
// Suffix table searched by r_Step_3. Result codes as dispatched there:
// 1 -> replace with "al", 2 -> replace with "ic", 3 -> delete.
private final static Among a_4[] = {
new Among ( "icate", -1, 2, "", methodObject ),
new Among ( "ative", -1, 3, "", methodObject ),
new Among ( "alize", -1, 1, "", methodObject ),
new Among ( "iciti", -1, 2, "", methodObject ),
new Among ( "ical", -1, 2, "", methodObject ),
new Among ( "ful", -1, 3, "", methodObject ),
new Among ( "ness", -1, 3, "", methodObject )
};
// Suffix table searched by r_Step_4. Result codes as dispatched there:
// 1 -> delete, 2 ("ion") -> delete only when preceded by "s" or "t".
private final static Among a_5[] = {
new Among ( "ic", -1, 1, "", methodObject ),
new Among ( "ance", -1, 1, "", methodObject ),
new Among ( "ence", -1, 1, "", methodObject ),
new Among ( "able", -1, 1, "", methodObject ),
new Among ( "ible", -1, 1, "", methodObject ),
new Among ( "ate", -1, 1, "", methodObject ),
new Among ( "ive", -1, 1, "", methodObject ),
new Among ( "ize", -1, 1, "", methodObject ),
new Among ( "iti", -1, 1, "", methodObject ),
new Among ( "al", -1, 1, "", methodObject ),
new Among ( "ism", -1, 1, "", methodObject ),
new Among ( "ion", -1, 2, "", methodObject ),
new Among ( "er", -1, 1, "", methodObject ),
new Among ( "ous", -1, 1, "", methodObject ),
new Among ( "ant", -1, 1, "", methodObject ),
new Among ( "ent", -1, 1, "", methodObject ),
new Among ( "ment", 15, 1, "", methodObject ),
new Among ( "ement", 16, 1, "", methodObject ),
new Among ( "ou", -1, 1, "", methodObject )
};
// Character grouping always passed with the bounds 97..121 ('a'..'y').
// NOTE(review): presumably a bitmap, 8 characters per element, starting at the
// lower bound; read that way it selects a, e, i, o, u, y -- confirm against
// the in_grouping/out_grouping implementation.
private static final char g_v[] = {17, 65, 16, 1 };
// Character grouping passed with the bounds 89..121 ('Y'..'y') by r_shortv.
// NOTE(review): read as the same kind of bitmap it selects Y, a, e, i, o, u,
// w, x, y -- confirm against the out_grouping_b implementation.
private static final char g_v_WXY[] = {1, 17, 65, 208, 1 };
// Set by stem() whenever it rewrites a "y" to "Y"; tested at the end of stem()
// to decide whether the buffer must be scanned to turn "Y" back into "y".
private boolean B_Y_found;
// Region marks computed by stem(): both start at limit and are moved to cursor
// positions found while scanning forward. r_R2() compares I_p2 with the
// cursor, r_R1() compares I_p1 with the cursor.
private int I_p2;
private int I_p1;
/**
 * Copies the Porter-specific state (the Y flag and both region marks) from
 * {@code other} into this instance, then lets the superclass copy the rest.
 *
 * @param other the stemmer whose state is taken over
 */
private void copy_from(porterStemmer other) {
    this.B_Y_found = other.B_Y_found;
    this.I_p1 = other.I_p1;
    this.I_p2 = other.I_p2;
    super.copy_from(other);
}
/**
 * Runs three backward grouping checks in sequence: outside g_v_WXY (bounds
 * 89..121), then inside g_v (bounds 97..121), then outside g_v (bounds 97..121).
 * NOTE(review): presumably this recognises a "short vowel" ending, i.e.
 * non-vowel, vowel, non-vowel other than w/x/Y -- confirm against the
 * Snowball script.
 *
 * @return {@code true} only if all three checks succeed
 */
private boolean r_shortv() {
    // && short-circuits, so a later check is never evaluated once an earlier
    // one has failed.
    return out_grouping_b(g_v_WXY, 89, 121)
        && in_grouping_b(g_v, 97, 121)
        && out_grouping_b(g_v, 97, 121);
}
/**
 * Region test R1.
 *
 * @return {@code true} when the cursor is at or after the I_p1 mark
 */
private boolean r_R1() {
    return I_p1 <= cursor;
}
/**
 * Region test R2.
 *
 * @return {@code true} when the cursor is at or after the I_p2 mark
 */
private boolean r_R2() {
    return I_p2 <= cursor;
}
/**
 * Step 1a: looks up the ending before the cursor in table a_0 and rewrites it
 * according to the result code: 1 becomes "ss", 2 becomes "i", 3 is deleted.
 * Any other non-zero code (the table uses -1 for "ss") leaves the text as is.
 *
 * @return {@code false} if the lookup yields 0, {@code true} otherwise
 */
private boolean r_Step_1a() {
    ket = cursor;
    final int code = find_among_b(a_0, 4);
    if (code == 0) {
        return false;
    }
    bra = cursor;

    if (code == 1) {
        slice_from("ss");
    } else if (code == 2) {
        slice_from("i");
    } else if (code == 3) {
        slice_del();
    }
    return true;
}
/**
 * Step 1b: handles the endings listed in table a_2.
 * <ul>
 * <li>Code 1: if R1 holds, the ending is replaced with "ee".</li>
 * <li>Code 2: the ending is deleted provided a g_v character can be found
 * scanning backwards from it; the new ending is then looked up in table a_1
 * and fixed up: code 1 inserts "e", code 2 deletes the last character,
 * code 3 inserts "e" only when the cursor sits at I_p1 and r_shortv()
 * succeeds.</li>
 * </ul>
 *
 * @return {@code false} as soon as any lookup or condition fails,
 *         {@code true} otherwise
 */
private boolean r_Step_1b() {
    ket = cursor;
    final int suffixCode = find_among_b(a_2, 3);
    if (suffixCode == 0) {
        return false;
    }
    bra = cursor;

    if (suffixCode == 1) {
        if (!r_R1()) {
            return false;
        }
        slice_from("ee");
        return true;
    }
    if (suffixCode != 2) {
        return true;
    }

    // Scan backwards for a g_v character; the position is remembered as an
    // offset from limit and restored afterwards, so this only tests.
    final int suffixStart = limit - cursor;
    while (!in_grouping_b(g_v, 97, 121)) {
        if (cursor <= limit_backward) {
            return false;
        }
        cursor--;
    }
    cursor = limit - suffixStart;
    slice_del();

    // Look at the ending left behind by the deletion, again without
    // consuming it.
    final int stemEnd = limit - cursor;
    final int fixupCode = find_among_b(a_1, 13);
    if (fixupCode == 0) {
        return false;
    }
    cursor = limit - stemEnd;

    if (fixupCode == 1) {
        final int insertAt = cursor;
        insert(cursor, cursor, "e");
        cursor = insertAt;
    } else if (fixupCode == 2) {
        ket = cursor;
        if (cursor <= limit_backward) {
            return false;
        }
        cursor--;
        bra = cursor;
        slice_del();
    } else if (fixupCode == 3) {
        if (cursor != I_p1) {
            return false;
        }
        final int beforeTest = limit - cursor;
        if (!r_shortv()) {
            return false;
        }
        cursor = limit - beforeTest;
        final int insertAt = cursor;
        insert(cursor, cursor, "e");
        cursor = insertAt;
    }
    return true;
}
/**
 * Step 1c: replaces a final "y" or "Y" with "i", provided a g_v character can
 * be found scanning backwards from it.
 *
 * @return {@code false} if the text does not end in "y"/"Y" or the backward
 *         scan reaches limit_backward without a match, {@code true} otherwise
 */
private boolean r_Step_1c() {
    ket = cursor;
    final int mark = limit - cursor;
    if (!eq_s_b(1, "y")) {
        // Retry from the same position with the upper-case form.
        cursor = limit - mark;
        if (!eq_s_b(1, "Y")) {
            return false;
        }
    }
    bra = cursor;

    while (!in_grouping_b(g_v, 97, 121)) {
        if (cursor <= limit_backward) {
            return false;
        }
        cursor--;
    }
    slice_from("i");
    return true;
}
/**
 * Replacement text for each Step 2 result code (1..14). Index 0 is a
 * placeholder: code 0 makes r_Step_2 return before any replacement.
 */
private static final String[] STEP_2_REPLACEMENTS = {
    null,
    "tion", "ence", "ance", "able", "ent", "e", "ize",
    "ate", "al", "al", "ful", "ous", "ive", "ble"
};

/**
 * Step 2: looks up the ending before the cursor in table a_3 and, if R1
 * holds, replaces it with the text selected by the result code.
 *
 * @return {@code false} if the lookup yields 0 or R1 does not hold,
 *         {@code true} otherwise
 */
private boolean r_Step_2() {
    ket = cursor;
    final int code = find_among_b(a_3, 20);
    if (code == 0) {
        return false;
    }
    bra = cursor;
    if (!r_R1()) {
        return false;
    }
    // Codes outside 1..14 have no replacement and leave the text untouched.
    if (code >= 1 && code < STEP_2_REPLACEMENTS.length) {
        slice_from(STEP_2_REPLACEMENTS[code]);
    }
    return true;
}
/**
 * Step 3: looks up the ending before the cursor in table a_4 and, if R1
 * holds, rewrites it: code 1 becomes "al", code 2 becomes "ic", code 3 is
 * deleted.
 *
 * @return {@code false} if the lookup yields 0 or R1 does not hold,
 *         {@code true} otherwise
 */
private boolean r_Step_3() {
    ket = cursor;
    final int code = find_among_b(a_4, 7);
    if (code == 0) {
        return false;
    }
    bra = cursor;
    if (!r_R1()) {
        return false;
    }

    if (code == 1) {
        slice_from("al");
    } else if (code == 2) {
        slice_from("ic");
    } else if (code == 3) {
        slice_del();
    }
    return true;
}
/**
 * Step 4: looks up the ending before the cursor in table a_5 and, if R2
 * holds, deletes it. For code 2 (the "ion" entry) the deletion happens only
 * when the ending is preceded by "s" or "t".
 *
 * @return {@code false} if the lookup yields 0, R2 does not hold, or the
 *         code 2 precondition fails; {@code true} otherwise
 */
private boolean r_Step_4() {
    ket = cursor;
    final int code = find_among_b(a_5, 19);
    if (code == 0) {
        return false;
    }
    bra = cursor;
    if (!r_R2()) {
        return false;
    }

    if (code == 1) {
        slice_del();
    } else if (code == 2) {
        final int mark = limit - cursor;
        if (!eq_s_b(1, "s")) {
            // Retry from the same position with the alternative letter.
            cursor = limit - mark;
            if (!eq_s_b(1, "t")) {
                return false;
            }
        }
        slice_del();
    }
    return true;
}
/**
 * Step 5a: deletes a final "e" when R2 holds, or when R1 holds and
 * r_shortv() fails for the text before the "e".
 *
 * @return {@code false} if there is no final "e" or neither condition is
 *         met, {@code true} after the deletion
 */
private boolean r_Step_5a() {
    ket = cursor;
    if (!eq_s_b(1, "e")) {
        return false;
    }
    bra = cursor;

    final int mark = limit - cursor;
    if (!r_R2()) {
        cursor = limit - mark;
        if (!r_R1()) {
            return false;
        }
        // Negated test: a successful r_shortv() vetoes the deletion; on
        // failure the cursor is put back where the test started.
        final int beforeTest = limit - cursor;
        if (r_shortv()) {
            return false;
        }
        cursor = limit - beforeTest;
    }
    slice_del();
    return true;
}
/**
 * Step 5b: deletes a final "l" when R2 holds at the position before it and
 * that "l" is itself preceded by another "l".
 *
 * @return {@code false} if any of the three conditions fails,
 *         {@code true} after the deletion
 */
private boolean r_Step_5b() {
    ket = cursor;
    if (!eq_s_b(1, "l")) {
        return false;
    }
    bra = cursor;

    // || short-circuits: the second "l" is only looked for once R2 holds.
    if (!r_R2() || !eq_s_b(1, "l")) {
        return false;
    }
    slice_del();
    return true;
}
/**
 * Stems the text currently held by this stemmer.
 * <ol>
 * <li>Forward pass: a leading "y", and every "y" that directly follows a g_v
 * character, is rewritten to "Y" and B_Y_found is set.</li>
 * <li>The region marks I_p1 and I_p2 are computed.</li>
 * <li>Backward pass: Steps 1a, 1b, 1c, 2, 3, 4, 5a and 5b run in that order,
 * each starting from the end of the text; their results are ignored.</li>
 * <li>Forward pass: if B_Y_found is set, every "Y" is rewritten to "y".</li>
 * </ol>
 *
 * @return always {@code true}
 */
public boolean stem() {
    B_Y_found = false;
    markLeadingY();
    markYAfterGrouping();
    locateRegions();

    // Switch to backward processing: the current position becomes the
    // backward limit and scanning starts from the end of the text.
    limit_backward = cursor;
    cursor = limit;

    // Each step may change limit, so the position is kept as an offset from
    // limit taken before the step and re-applied after it.
    int offsetFromEnd = limit - cursor;
    r_Step_1a();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_1b();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_1c();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_2();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_3();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_4();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_5a();
    cursor = limit - offsetFromEnd;

    offsetFromEnd = limit - cursor;
    r_Step_5b();
    cursor = limit - offsetFromEnd;

    // Back to forward processing from the start of the text.
    cursor = limit_backward;
    restoreMarkedY();
    return true;
}

/** Rewrites a "y" at the cursor to "Y" and records it; the cursor is restored. */
private void markLeadingY() {
    final int start = cursor;
    bra = cursor;
    if (eq_s(1, "y")) {
        ket = cursor;
        slice_from("Y");
        B_Y_found = true;
    }
    cursor = start;
}

/**
 * Repeatedly searches forward for a g_v character immediately followed by
 * "y", rewrites that "y" to "Y" and records it. The cursor is restored to
 * where the search began.
 */
private void markYAfterGrouping() {
    final int start = cursor;
    while (true) {
        final int roundStart = cursor;
        boolean found = false;
        while (true) {
            final int probe = cursor;
            boolean hit = false;
            if (in_grouping(g_v, 97, 121)) {
                bra = cursor;
                if (eq_s(1, "y")) {
                    ket = cursor;
                    hit = true;
                }
            }
            // The probe never consumes text, whether or not it matched.
            cursor = probe;
            if (hit) {
                found = true;
                break;
            }
            if (cursor >= limit) {
                break;
            }
            cursor++;
        }
        if (!found) {
            cursor = roundStart;
            break;
        }
        slice_from("Y");
        B_Y_found = true;
    }
    cursor = start;
}

/**
 * Sets I_p1 and I_p2. Both default to limit. I_p1 becomes the position
 * reached after going past a g_v character and then past a non-g_v character;
 * I_p2 is the position reached by repeating that from I_p1. A mark keeps its
 * default if the end of the text is reached first. The cursor is restored.
 */
private void locateRegions() {
    I_p1 = limit;
    I_p2 = limit;
    final int start = cursor;
    if (goPastInGrouping() && goPastOutGrouping()) {
        I_p1 = cursor;
        if (goPastInGrouping() && goPastOutGrouping()) {
            I_p2 = cursor;
        }
    }
    cursor = start;
}

/**
 * Advances the cursor until in_grouping succeeds for g_v.
 *
 * @return {@code false} if limit is reached without success
 */
private boolean goPastInGrouping() {
    while (!in_grouping(g_v, 97, 121)) {
        if (cursor >= limit) {
            return false;
        }
        cursor++;
    }
    return true;
}

/**
 * Advances the cursor until out_grouping succeeds for g_v.
 *
 * @return {@code false} if limit is reached without success
 */
private boolean goPastOutGrouping() {
    while (!out_grouping(g_v, 97, 121)) {
        if (cursor >= limit) {
            return false;
        }
        cursor++;
    }
    return true;
}

/**
 * If any "y" was rewritten to "Y" during this run, searches forward for
 * every "Y" and rewrites it to "y". The cursor is restored afterwards.
 */
private void restoreMarkedY() {
    final int start = cursor;
    if (B_Y_found) {
        while (true) {
            final int roundStart = cursor;
            boolean found = false;
            while (true) {
                final int probe = cursor;
                bra = cursor;
                final boolean hit = eq_s(1, "Y");
                if (hit) {
                    ket = cursor;
                }
                // The probe never consumes text, whether or not it matched.
                cursor = probe;
                if (hit) {
                    found = true;
                    break;
                }
                if (cursor >= limit) {
                    break;
                }
                cursor++;
            }
            if (!found) {
                cursor = roundStart;
                break;
            }
            slice_from("y");
        }
    }
    cursor = start;
}
/**
 * Treats every {@code porterStemmer} as equal to every other one; the
 * per-instance stemming state is not compared.
 *
 * @param o the object to compare with; may be {@code null}
 * @return {@code true} if {@code o} is a {@code porterStemmer}
 */
@Override
public boolean equals( Object o ) {
    return o instanceof porterStemmer;
}
/**
 * Returns the same value for every instance, derived from the class name, so
 * that it agrees with {@code equals}, which considers all instances equal.
 *
 * @return the hash code of this class's name
 */
@Override
public int hashCode() {
    return porterStemmer.class.getName().hashCode();
}
}