|
|
|
/*
|
|
|
|
* Port of Snowball stemmers on C#
|
|
|
|
* Original stemmers can be found on http://snowball.tartarus.org
|
|
|
|
* Licence still BSD: http://snowball.tartarus.org/license.php
|
|
|
|
*
|
|
|
|
* Most of stemmers are ported from Java by Iveonik Systems ltd. (www.iveonik.com)
|
|
|
|
*/
|
|
|
|
|
|
|
|
using ZeroLevel.Services.Semantic;
|
|
|
|
|
|
|
|
namespace Iveonik.Stemmers
|
|
|
|
{
|
|
|
|
public class RussianStemmer : StemmerOperations, ILexer
|
|
|
|
{
|
|
|
|
private readonly static RussianStemmer methodObject = new RussianStemmer();
|
|
|
|
|
|
|
|
private readonly static Among[] a_0 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0432", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0432", 0, 2, null ),
|
|
|
|
new Among ( "\u044B\u0432", 0, 2, null ),
|
|
|
|
new Among ( "\u0432\u0448\u0438", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0432\u0448\u0438", 3, 2, null ),
|
|
|
|
new Among ( "\u044B\u0432\u0448\u0438", 3, 2, null ),
|
|
|
|
new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, null ),
|
|
|
|
new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_1 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0435\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u044B\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043C\u0438", -1, 1, null ),
|
|
|
|
new Among ( "\u044B\u043C\u0438", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u044B\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u044B\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0433\u043E", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u0433\u043E", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043C\u0443", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u043C\u0443", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0445", -1, 1, null ),
|
|
|
|
new Among ( "\u044B\u0445", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u044E", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u044E", -1, 1, null ),
|
|
|
|
new Among ( "\u0443\u044E", -1, 1, null ),
|
|
|
|
new Among ( "\u044E\u044E", -1, 1, null ),
|
|
|
|
new Among ( "\u0430\u044F", -1, 1, null ),
|
|
|
|
new Among ( "\u044F\u044F", -1, 1, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_2 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0435\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u043D\u043D", -1, 1, null ),
|
|
|
|
new Among ( "\u0432\u0448", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0432\u0448", 2, 2, null ),
|
|
|
|
new Among ( "\u044B\u0432\u0448", 2, 2, null ),
|
|
|
|
new Among ( "\u0449", -1, 1, null ),
|
|
|
|
new Among ( "\u044E\u0449", 5, 1, null ),
|
|
|
|
new Among ( "\u0443\u044E\u0449", 6, 2, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_3 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0441\u044C", -1, 1, null ),
|
|
|
|
new Among ( "\u0441\u044F", -1, 1, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_4 =
|
|
|
|
{
|
|
|
|
new Among ( "\u043B\u0430", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043B\u0430", 0, 2, null ),
|
|
|
|
new Among ( "\u044B\u043B\u0430", 0, 2, null ),
|
|
|
|
new Among ( "\u043D\u0430", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043D\u0430", 3, 2, null ),
|
|
|
|
new Among ( "\u0435\u0442\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0442\u0435", -1, 2, null ),
|
|
|
|
new Among ( "\u0439\u0442\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0439\u0442\u0435", 7, 2, null ),
|
|
|
|
new Among ( "\u0443\u0439\u0442\u0435", 7, 2, null ),
|
|
|
|
new Among ( "\u043B\u0438", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043B\u0438", 10, 2, null ),
|
|
|
|
new Among ( "\u044B\u043B\u0438", 10, 2, null ),
|
|
|
|
new Among ( "\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0439", 13, 2, null ),
|
|
|
|
new Among ( "\u0443\u0439", 13, 2, null ),
|
|
|
|
new Among ( "\u043B", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043B", 16, 2, null ),
|
|
|
|
new Among ( "\u044B\u043B", 16, 2, null ),
|
|
|
|
new Among ( "\u0435\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043C", -1, 2, null ),
|
|
|
|
new Among ( "\u044B\u043C", -1, 2, null ),
|
|
|
|
new Among ( "\u043D", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043D", 22, 2, null ),
|
|
|
|
new Among ( "\u043B\u043E", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u043B\u043E", 24, 2, null ),
|
|
|
|
new Among ( "\u044B\u043B\u043E", 24, 2, null ),
|
|
|
|
new Among ( "\u043D\u043E", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043D\u043E", 27, 2, null ),
|
|
|
|
new Among ( "\u043D\u043D\u043E", 27, 1, null ),
|
|
|
|
new Among ( "\u0435\u0442", -1, 1, null ),
|
|
|
|
new Among ( "\u0443\u0435\u0442", 30, 2, null ),
|
|
|
|
new Among ( "\u0438\u0442", -1, 2, null ),
|
|
|
|
new Among ( "\u044B\u0442", -1, 2, null ),
|
|
|
|
new Among ( "\u044E\u0442", -1, 1, null ),
|
|
|
|
new Among ( "\u0443\u044E\u0442", 34, 2, null ),
|
|
|
|
new Among ( "\u044F\u0442", -1, 2, null ),
|
|
|
|
new Among ( "\u043D\u044B", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043D\u044B", 37, 2, null ),
|
|
|
|
new Among ( "\u0442\u044C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0442\u044C", 39, 2, null ),
|
|
|
|
new Among ( "\u044B\u0442\u044C", 39, 2, null ),
|
|
|
|
new Among ( "\u0435\u0448\u044C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0448\u044C", -1, 2, null ),
|
|
|
|
new Among ( "\u044E", -1, 2, null ),
|
|
|
|
new Among ( "\u0443\u044E", 44, 2, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_5 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0430", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0432", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u0432", -1, 1, null ),
|
|
|
|
new Among ( "\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0435", 3, 1, null ),
|
|
|
|
new Among ( "\u044C\u0435", 3, 1, null ),
|
|
|
|
new Among ( "\u0438", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0438", 6, 1, null ),
|
|
|
|
new Among ( "\u0438\u0438", 6, 1, null ),
|
|
|
|
new Among ( "\u0430\u043C\u0438", 6, 1, null ),
|
|
|
|
new Among ( "\u044F\u043C\u0438", 6, 1, null ),
|
|
|
|
new Among ( "\u0438\u044F\u043C\u0438", 10, 1, null ),
|
|
|
|
new Among ( "\u0439", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u0439", 12, 1, null ),
|
|
|
|
new Among ( "\u0438\u0435\u0439", 13, 1, null ),
|
|
|
|
new Among ( "\u0438\u0439", 12, 1, null ),
|
|
|
|
new Among ( "\u043E\u0439", 12, 1, null ),
|
|
|
|
new Among ( "\u0430\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0435\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u0435\u043C", 18, 1, null ),
|
|
|
|
new Among ( "\u043E\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u044F\u043C", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u044F\u043C", 21, 1, null ),
|
|
|
|
new Among ( "\u043E", -1, 1, null ),
|
|
|
|
new Among ( "\u0443", -1, 1, null ),
|
|
|
|
new Among ( "\u0430\u0445", -1, 1, null ),
|
|
|
|
new Among ( "\u044F\u0445", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u044F\u0445", 26, 1, null ),
|
|
|
|
new Among ( "\u044B", -1, 1, null ),
|
|
|
|
new Among ( "\u044C", -1, 1, null ),
|
|
|
|
new Among ( "\u044E", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u044E", 30, 1, null ),
|
|
|
|
new Among ( "\u044C\u044E", 30, 1, null ),
|
|
|
|
new Among ( "\u044F", -1, 1, null ),
|
|
|
|
new Among ( "\u0438\u044F", 33, 1, null ),
|
|
|
|
new Among ( "\u044C\u044F", 33, 1, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_6 =
|
|
|
|
{
|
|
|
|
new Among ( "\u043E\u0441\u0442", -1, 1, null ),
|
|
|
|
new Among ( "\u043E\u0441\u0442\u044C", -1, 1, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private readonly static Among[] a_7 =
|
|
|
|
{
|
|
|
|
new Among ( "\u0435\u0439\u0448\u0435", -1, 1, null ),
|
|
|
|
new Among ( "\u043D", -1, 2, null ),
|
|
|
|
new Among ( "\u0435\u0439\u0448", -1, 1, null ),
|
|
|
|
new Among ( "\u044C", -1, 3, null )
|
|
|
|
};
|
|
|
|
|
|
|
|
private static readonly char[] g_v = { (char)33, (char)65, (char)8, (char)232 };
|
|
|
|
private int I_p2;
|
|
|
|
private int I_pV;
|
|
|
|
|
|
|
|
private void copy_from(RussianStemmer other)
|
|
|
|
{
|
|
|
|
I_p2 = other.I_p2;
|
|
|
|
I_pV = other.I_pV;
|
|
|
|
copy_from(other);
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_mark_regions()
|
|
|
|
{
|
|
|
|
bool root = false;
|
|
|
|
bool subroot = false;
|
|
|
|
int v_1;
|
|
|
|
|
|
|
|
// (, line 57
|
|
|
|
|
|
|
|
I_pV = limit;
|
|
|
|
|
|
|
|
I_p2 = limit;
|
|
|
|
|
|
|
|
// do, line 61
|
|
|
|
|
|
|
|
v_1 = cursor;
|
|
|
|
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// (, line 61
|
|
|
|
// gopast, line 62
|
|
|
|
while (true)
|
|
|
|
{
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (!(in_grouping(g_v, 1072, 1103)))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
if (cursor >= limit)
|
|
|
|
{
|
|
|
|
root = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
cursor++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (root) break;
|
|
|
|
root = false;
|
|
|
|
subroot = false;
|
|
|
|
// setmark pV, line 62
|
|
|
|
I_pV = cursor;
|
|
|
|
// gopast, line 62
|
|
|
|
while (true)
|
|
|
|
{
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (!(out_grouping(g_v, 1072, 1103)))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
if (cursor >= limit)
|
|
|
|
{
|
|
|
|
root = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
cursor++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (root) break;
|
|
|
|
root = false;
|
|
|
|
subroot = false;
|
|
|
|
// gopast, line 63
|
|
|
|
while (true)
|
|
|
|
{
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (!(in_grouping(g_v, 1072, 1103)))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
if (cursor >= limit)
|
|
|
|
{
|
|
|
|
root = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
cursor++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (root) break;
|
|
|
|
root = false;
|
|
|
|
subroot = false;
|
|
|
|
// gopast, line 63
|
|
|
|
while (true)
|
|
|
|
{
|
|
|
|
do
|
|
|
|
{
|
|
|
|
if (!(out_grouping(g_v, 1072, 1103)))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
if (cursor >= limit)
|
|
|
|
{
|
|
|
|
root = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
cursor++;
|
|
|
|
}
|
|
|
|
if (root) break;
|
|
|
|
// setmark p2, line 63
|
|
|
|
I_p2 = cursor;
|
|
|
|
} while (false);
|
|
|
|
cursor = v_1;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_R2()
|
|
|
|
{
|
|
|
|
if (!(I_p2 <= cursor))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_perfective_gerund()
|
|
|
|
{
|
|
|
|
bool subroot = false;
|
|
|
|
int among_var;
|
|
|
|
int v_1;
|
|
|
|
// (, line 71
|
|
|
|
// [, line 72
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 72
|
|
|
|
among_var = find_among_b(a_0, 9);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 72
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 76
|
|
|
|
// or, line 76
|
|
|
|
do
|
|
|
|
{
|
|
|
|
v_1 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// literal, line 76
|
|
|
|
if (!(eq_s_b(1, "\u0430")))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
cursor = limit - v_1;
|
|
|
|
// literal, line 76
|
|
|
|
if (!(eq_s_b(1, "\u044F")))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
// delete, line 76
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
// (, line 83
|
|
|
|
// delete, line 83
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_adjective()
|
|
|
|
{
|
|
|
|
int among_var;
|
|
|
|
// (, line 87
|
|
|
|
// [, line 88
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 88
|
|
|
|
among_var = find_among_b(a_1, 26);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 88
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 97
|
|
|
|
// delete, line 97
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_adjectival()
|
|
|
|
{
|
|
|
|
bool root = false;
|
|
|
|
bool subroot = false;
|
|
|
|
int among_var;
|
|
|
|
int v_1;
|
|
|
|
int v_2;
|
|
|
|
// (, line 101
|
|
|
|
// call adjective, line 102
|
|
|
|
if (!r_adjective())
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// try, line 109
|
|
|
|
v_1 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// (, line 109
|
|
|
|
// [, line 110
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 110
|
|
|
|
among_var = find_among_b(a_2, 8);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
cursor = limit - v_1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
// ], line 110
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
cursor = limit - v_1;
|
|
|
|
goto default;
|
|
|
|
case 1:
|
|
|
|
// (, line 115
|
|
|
|
// or, line 115
|
|
|
|
do
|
|
|
|
{
|
|
|
|
v_2 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// literal, line 115
|
|
|
|
if (!(eq_s_b(1, "\u0430")))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
if (subroot) break;
|
|
|
|
cursor = limit - v_2;
|
|
|
|
// literal, line 115
|
|
|
|
if (!(eq_s_b(1, "\u044F")))
|
|
|
|
{
|
|
|
|
cursor = limit - v_1;
|
|
|
|
goto default;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
// delete, line 115
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
// (, line 122
|
|
|
|
// delete, line 122
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
default: root = true; break;
|
|
|
|
}
|
|
|
|
if (root) break;
|
|
|
|
} while (false);
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_reflexive()
|
|
|
|
{
|
|
|
|
int among_var;
|
|
|
|
// (, line 128
|
|
|
|
// [, line 129
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 129
|
|
|
|
among_var = find_among_b(a_3, 2);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 129
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 132
|
|
|
|
// delete, line 132
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_verb()
|
|
|
|
{
|
|
|
|
bool subroot = false;
|
|
|
|
int among_var;
|
|
|
|
int v_1;
|
|
|
|
// (, line 136
|
|
|
|
// [, line 137
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 137
|
|
|
|
among_var = find_among_b(a_4, 46);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 137
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 143
|
|
|
|
// or, line 143
|
|
|
|
do
|
|
|
|
{
|
|
|
|
v_1 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// literal, line 143
|
|
|
|
if (!(eq_s_b(1, "\u0430")))
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
cursor = limit - v_1;
|
|
|
|
// literal, line 143
|
|
|
|
if (!(eq_s_b(1, "\u044F")))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
// delete, line 143
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
// (, line 151
|
|
|
|
// delete, line 151
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_noun()
|
|
|
|
{
|
|
|
|
int among_var;
|
|
|
|
// (, line 159
|
|
|
|
// [, line 160
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 160
|
|
|
|
among_var = find_among_b(a_5, 36);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 160
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 167
|
|
|
|
// delete, line 167
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_derivational()
|
|
|
|
{
|
|
|
|
int among_var;
|
|
|
|
// (, line 175
|
|
|
|
// [, line 176
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 176
|
|
|
|
among_var = find_among_b(a_6, 2);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 176
|
|
|
|
bra = cursor;
|
|
|
|
// call R2, line 176
|
|
|
|
if (!r_R2())
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 179
|
|
|
|
// delete, line 179
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
private bool r_tidy_up()
|
|
|
|
{
|
|
|
|
int among_var;
|
|
|
|
// (, line 183
|
|
|
|
// [, line 184
|
|
|
|
ket = cursor;
|
|
|
|
// substring, line 184
|
|
|
|
among_var = find_among_b(a_7, 4);
|
|
|
|
if (among_var == 0)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 184
|
|
|
|
bra = cursor;
|
|
|
|
switch (among_var)
|
|
|
|
{
|
|
|
|
case 0:
|
|
|
|
return false;
|
|
|
|
|
|
|
|
case 1:
|
|
|
|
// (, line 188
|
|
|
|
// delete, line 188
|
|
|
|
slice_del();
|
|
|
|
// [, line 189
|
|
|
|
ket = cursor;
|
|
|
|
// literal, line 189
|
|
|
|
if (!(eq_s_b(1, "\u043D")))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// ], line 189
|
|
|
|
bra = cursor;
|
|
|
|
// literal, line 189
|
|
|
|
if (!(eq_s_b(1, "\u043D")))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// delete, line 189
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 2:
|
|
|
|
// (, line 192
|
|
|
|
// literal, line 192
|
|
|
|
if (!(eq_s_b(1, "\u043D")))
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
// delete, line 192
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 3:
|
|
|
|
// (, line 194
|
|
|
|
// delete, line 194
|
|
|
|
slice_del();
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
public bool CanStem()
|
|
|
|
{
|
|
|
|
bool root = false;
|
|
|
|
bool subroot = false;
|
|
|
|
int v_1;
|
|
|
|
int v_2;
|
|
|
|
int v_3;
|
|
|
|
int v_4;
|
|
|
|
int v_5;
|
|
|
|
int v_6;
|
|
|
|
int v_7;
|
|
|
|
int v_8;
|
|
|
|
int v_9;
|
|
|
|
int v_10;
|
|
|
|
// (, line 199
|
|
|
|
// do, line 201
|
|
|
|
v_1 = cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call mark_regions, line 201
|
|
|
|
if (!r_mark_regions())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
cursor = v_1;
|
|
|
|
// backwards, line 202
|
|
|
|
limit_backward = cursor; cursor = limit;
|
|
|
|
// setlimit, line 202
|
|
|
|
v_2 = limit - cursor;
|
|
|
|
// tomark, line 202
|
|
|
|
if (cursor < I_pV)
|
|
|
|
{
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
cursor = I_pV;
|
|
|
|
v_3 = limit_backward;
|
|
|
|
limit_backward = cursor;
|
|
|
|
cursor = limit - v_2;
|
|
|
|
// (, line 202
|
|
|
|
// do, line 203
|
|
|
|
v_4 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// (, line 203
|
|
|
|
// or, line 204
|
|
|
|
do
|
|
|
|
{
|
|
|
|
v_5 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call perfective_gerund, line 204
|
|
|
|
if (!r_perfective_gerund())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
cursor = limit - v_5;
|
|
|
|
// (, line 205
|
|
|
|
// try, line 205
|
|
|
|
v_6 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call reflexive, line 205
|
|
|
|
if (!r_reflexive())
|
|
|
|
{
|
|
|
|
cursor = limit - v_6;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
// or, line 206
|
|
|
|
subroot = false;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
v_7 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call adjectival, line 206
|
|
|
|
if (!r_adjectival())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
cursor = limit - v_7;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call verb, line 206
|
|
|
|
if (!r_verb())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
subroot = true;
|
|
|
|
if (subroot) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (subroot) break;
|
|
|
|
|
|
|
|
cursor = limit - v_7;
|
|
|
|
// call noun, line 206
|
|
|
|
if (!r_noun())
|
|
|
|
{
|
|
|
|
root = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (root) break;
|
|
|
|
} while (false);
|
|
|
|
|
|
|
|
if (root) break;
|
|
|
|
} while (false);
|
|
|
|
cursor = limit - v_4;
|
|
|
|
|
|
|
|
root = false;
|
|
|
|
subroot = false;
|
|
|
|
|
|
|
|
// try, line 209
|
|
|
|
v_8 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// (, line 209
|
|
|
|
// [, line 209
|
|
|
|
ket = cursor;
|
|
|
|
// literal, line 209
|
|
|
|
if (!(eq_s_b(1, "\u0438")))
|
|
|
|
{
|
|
|
|
cursor = limit - v_8;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
// ], line 209
|
|
|
|
bra = cursor;
|
|
|
|
// delete, line 209
|
|
|
|
slice_del();
|
|
|
|
} while (false);
|
|
|
|
// do, line 212
|
|
|
|
v_9 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call derivational, line 212
|
|
|
|
if (!r_derivational())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
cursor = limit - v_9;
|
|
|
|
// do, line 213
|
|
|
|
v_10 = limit - cursor;
|
|
|
|
do
|
|
|
|
{
|
|
|
|
// call tidy_up, line 213
|
|
|
|
if (!r_tidy_up())
|
|
|
|
{
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
} while (false);
|
|
|
|
cursor = limit - v_10;
|
|
|
|
limit_backward = v_3;
|
|
|
|
cursor = limit_backward;
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
public string Lex(string s)
|
|
|
|
{
|
|
|
|
this.setCurrent(s.ToLowerInvariant());
|
|
|
|
this.CanStem();
|
|
|
|
return this.getCurrent();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|