Package org.apache.lucene.analysis.en

Examples of org.apache.lucene.analysis.en.EnglishPossessiveFilter


    @Override
    protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
        final Tokenizer source = new StandardTokenizer(matchVersion, reader);
        TokenStream result = new StandardFilter(matchVersion, source);
        if (matchVersion.onOrAfter(Version.LUCENE_31)) {
            result = new EnglishPossessiveFilter(result);
        }
        result = new LowerCaseFilter(matchVersion, result);
        ShingleAllStopFilter sf = new ShingleAllStopFilter(result, minNGram, maxNGram, stopwords);
        sf.setOutputUnigrams(outputUnigrams);
        if (!outputUnigrams) {
View Full Code Here


        final Tokenizer source = new StandardTokenizer(matchVersion, reader);
        TokenStream result = new StandardFilter(matchVersion, source);
        // prior to this we get the classic behavior, standardfilter does it for
        // us.
        if (matchVersion.onOrAfter(Version.LUCENE_31)) {
            result = new EnglishPossessiveFilter(result);
        }
        result = new LowerCaseFilter(matchVersion, result);
        result = new StopFilter(matchVersion, result, stopwords);
        if (stem) {
            if (!stemExclusionSet.isEmpty())
View Full Code Here

                return new SnowballFilter(tokenStream, new PorterStemmer());
            }
        } else if ("minimal_english".equalsIgnoreCase(language) || "minimalEnglish".equalsIgnoreCase(language)) {
            return new EnglishMinimalStemFilter(tokenStream);
        } else if ("possessive_english".equalsIgnoreCase(language) || "possessiveEnglish".equalsIgnoreCase(language)) {
            return new EnglishPossessiveFilter(tokenStream);

            // Finnish stemmers
        } else if ("finnish".equalsIgnoreCase(language)) {
            return new SnowballFilter(tokenStream, new FinnishStemmer());
        } else if ("light_finish".equalsIgnoreCase(language) || "lightFinish".equalsIgnoreCase(language)) {
View Full Code Here

      tokenizer = new StandardTokenizer40();
    }
    TokenStream result = tokenizer;
    // remove the possessive 's for english stemmers
    if (name.equals("English") || name.equals("Porter") || name.equals("Lovins"))
      result = new EnglishPossessiveFilter(result);
    // Use a special lowercase filter for turkish, the stemmer expects it.
    if (name.equals("Turkish"))
      result = new TurkishLowerCaseFilter(result);
    else
      result = new LowerCaseFilter(result);
View Full Code Here

    TokenStream result = new StandardTokenizer(matchVersion, reader);
    result = new StandardFilter(matchVersion, result);
    // remove the possessive 's for english stemmers
    if (matchVersion.onOrAfter(Version.LUCENE_31) &&
        (name.equals("English") || name.equals("Porter") || name.equals("Lovins")))
      result = new EnglishPossessiveFilter(result);
    // Use a special lowercase filter for turkish, the stemmer expects it.
    if (matchVersion.onOrAfter(Version.LUCENE_31) && name.equals("Turkish"))
      result = new TurkishLowerCaseFilter(result);
    else
      result = new LowerCaseFilter(matchVersion, result);
View Full Code Here

TOP

Related Classes of org.apache.lucene.analysis.en.EnglishPossessiveFilter

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.