You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
Zero/ZeroLevel/Services/Semantic/Snowball/CzechStemmer.cs

35 lines
1.1 KiB

/*
* Port of the Snowball stemmers to C#
* The original stemmers can be found at http://snowball.tartarus.org
* Licence still BSD: http://snowball.tartarus.org/license.php
*
* Most of stemmers are ported from Java by Iveonik Systems ltd. (www.iveonik.com)
*/
using ZeroLevel.Services.Semantic;
namespace Iveonik.Stemmers
{
/// <summary>
/// Czech stemmer exposed through the <see cref="ILexer"/> interface.
/// </summary>
/// <remarks>
/// The suffix-stripping passes and the current-word accessors used by
/// <see cref="Lex"/> are not declared in this class; presumably they are
/// inherited from <see cref="StemmerOperations"/> - confirm there.
/// NOTE(review): the word being processed appears to be held in inherited
/// instance state (setCurrent/getCurrent), so a single instance is presumably
/// not safe for concurrent calls - confirm against the base class.
/// </remarks>
public class CzechStemmer : StemmerOperations, ILexer
{
    /// <summary>
    /// Reduces a Czech word to its stem.
    /// </summary>
    /// <param name="input">
    /// Word to stem. It is lower-cased with the invariant culture before any
    /// suffix is stripped.
    /// </param>
    /// <returns>
    /// The current word as reported by <c>getCurrent()</c> once all passes have run.
    /// </returns>
    /// <exception cref="System.ArgumentNullException">
    /// <paramref name="input"/> is <c>null</c>.
    /// </exception>
    public string Lex(string input)
    {
        // Fail with a descriptive exception instead of the bare
        // NullReferenceException that input.ToLowerInvariant() would raise.
        if (input == null)
        {
            throw new System.ArgumentNullException(nameof(input));
        }

        setCurrent(input.ToLowerInvariant());

        // The passes below run in the same order as before; presumably each one
        // relies on the previous pass having already stripped its suffix.

        // Removes case endings from nouns and adjectives.
        removeCase();

        // Removes possessive endings (-ov- and -in-) from names.
        removePossessives();

        // Removes comparative endings.
        removeComparative();

        // Removes diminutive endings.
        removeDiminutive();

        // Removes augmentative endings.
        removeAugmentative();

        // Removes derivational suffixes from nouns.
        removeDerivational();

        return getCurrent();
    }
}
}

Powered by TurnKey Linux.