Class KStemmer


  • public class KStemmer
    extends java.lang.Object
    This class implements the Kstem algorithm.
    • Field Detail

      • exceptionWords

        private static final java.lang.String[] exceptionWords
      • directConflations

        private static final java.lang.String[][] directConflations
      • countryNationality

        private static final java.lang.String[][] countryNationality
      • supplementDict

        private static final java.lang.String[] supplementDict
      • properNouns

        private static final java.lang.String[] properNouns
      • word

        private final OpenStringBuilder word
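        Note: the following text does not describe this field; it appears to be a disabled ("caching off") block of cache declarations picked up from the source: private int maxCacheSize; private CharArrayMap cache = null; private static final String SAME = "SAME"; // use if stemmed form is the same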
      • j

        private int j
      • k

        private int k
      • ization

        private static char[] ization
      • ition

        private static char[] ition
      • ation

        private static char[] ation
      • ication

        private static char[] ication
      • result

        java.lang.String result
    • Constructor Detail

      • KStemmer

        KStemmer()
    • Method Detail

      • finalChar

        private char finalChar()
      • penultChar

        private char penultChar()
      • isVowel

        private boolean isVowel​(int index)
      • isCons

        private boolean isCons​(int index)
      • isAlpha

        private boolean isAlpha​(char ch)
      • stemLength

        private int stemLength()
      • endsIn

        private boolean endsIn​(char[] s)
      • endsIn

        private boolean endsIn​(char a,
                               char b)
      • endsIn

        private boolean endsIn​(char a,
                               char b,
                               char c)
      • endsIn

        private boolean endsIn​(char a,
                               char b,
                               char c,
                               char d)
      • plural

        private void plural()
      • setSuffix

        private void setSuffix​(java.lang.String s)
      • setSuff

        private void setSuff​(java.lang.String s,
                             int len)
      • lookup

        private boolean lookup()
      • pastTense

        private void pastTense()
      • doubleC

        private boolean doubleC​(int i)
      • vowelInStem

        private boolean vowelInStem()
      • aspect

        private void aspect()
      • ityEndings

        private void ityEndings()
      • nceEndings

        private void nceEndings()
      • nessEndings

        private void nessEndings()
      • ismEndings

        private void ismEndings()
      • mentEndings

        private void mentEndings()
      • izeEndings

        private void izeEndings()
      • ncyEndings

        private void ncyEndings()
      • bleEndings

        private void bleEndings()
      • icEndings

        private void icEndings()
      • ionEndings

        private void ionEndings()
      • erAndOrEndings

        private void erAndOrEndings()
      • lyEndings

        private void lyEndings()
      • alEndings

        private void alEndings()
      • iveEndings

        private void iveEndings()
      • stem

        java.lang.String stem​(java.lang.String term)
      • asString

        java.lang.String asString()
        Returns the result of the stem (assuming the word was changed) as a String.
      • asCharSequence

        java.lang.CharSequence asCharSequence()
      • getString

        java.lang.String getString()
      • getChars

        char[] getChars()
      • getLength

        int getLength()
      • matched

        private boolean matched()
      • stem

        boolean stem​(char[] term,
                     int len)
        Stems the text in the token. Returns true if changed.