Coverage Report - org.crosswire.jsword.index.lucene.analysis.EnglishLuceneAnalyzer
 
Classes in this File Line Coverage Branch Coverage Complexity
EnglishLuceneAnalyzer
0%
0/20
0%
0/14
3.333
 
 1  
 /**
 2  
  * Distribution License:
 3  
  * JSword is free software; you can redistribute it and/or modify it under
 4  
  * the terms of the GNU Lesser General Public License, version 2.1 or later
 5  
  * as published by the Free Software Foundation. This program is distributed
 6  
  * in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
 7  
  * the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 8  
  * See the GNU Lesser General Public License for more details.
 9  
  *
 10  
  * The License is available on the internet at:
 11  
  *      http://www.gnu.org/copyleft/lgpl.html
 12  
  * or by writing to:
 13  
  *      Free Software Foundation, Inc.
 14  
  *      59 Temple Place - Suite 330
 15  
  *      Boston, MA 02111-1307, USA
 16  
  *
 17  
  * © CrossWire Bible Society, 2007 - 2016
 18  
  *
 19  
  */
 20  
 package org.crosswire.jsword.index.lucene.analysis;
 21  
 
 22  
 import java.io.IOException;
 23  
 import java.io.Reader;
 24  
 
 25  
 import org.apache.lucene.analysis.LowerCaseTokenizer;
 26  
 import org.apache.lucene.analysis.PorterStemFilter;
 27  
 import org.apache.lucene.analysis.StopAnalyzer;
 28  
 import org.apache.lucene.analysis.StopFilter;
 29  
 import org.apache.lucene.analysis.TokenStream;
 30  
 import org.apache.lucene.util.Version;
 31  
 
 32  
 /**
 33  
  * English analyzer that works like Lucene's SimpleAnalyzer plus stemming
 34  
  * (LowerCaseTokenizer > PorterStemFilter). Like the AbstractBookAnalyzer,
 35  
  * {@link StopFilter} is off by default.
 36  
  * 
 37  
  * 
 38  
  * @see gnu.lgpl.License The GNU Lesser General Public License for details.
 39  
  * @author sijo cherian
 40  
  */
 41  
 public class EnglishLuceneAnalyzer extends AbstractBookAnalyzer {
 42  
 
 43  0
     public EnglishLuceneAnalyzer() {
 44  0
         stopSet = StopAnalyzer.ENGLISH_STOP_WORDS_SET;
 45  0
     }
 46  
 
 47  
     /**
 48  
      * Constructs a {@link LowerCaseTokenizer} whose tokens are optionally passed through a
 49  
      * {@link StopFilter} and {@link PorterStemFilter} for English.
 50  
      */
 51  
     @Override
 52  
     public final TokenStream tokenStream(String fieldName, Reader reader) {
 53  0
         TokenStream result = new LowerCaseTokenizer(reader);
 54  
 
 55  0
         if (doStopWords && stopSet != null) {
 56  0
             result = new StopFilter(StopFilter.getEnablePositionIncrementsVersionDefault(matchVersion), result, stopSet);
 57  
         }
 58  
 
 59  
         // Using Porter Stemmer
 60  0
         if (doStemming) {
 61  0
             result = new PorterStemFilter(result);
 62  
         }
 63  
 
 64  0
         return result;
 65  
     }
 66  
 
 67  
     /* (non-Javadoc)
 68  
      * @see org.apache.lucene.analysis.Analyzer#reusableTokenStream(java.lang.String, java.io.Reader)
 69  
      */
 70  
     @Override
 71  
     public TokenStream reusableTokenStream(String fieldName, Reader reader) throws IOException {
 72  0
         SavedStreams streams = (SavedStreams) getPreviousTokenStream();
 73  0
         if (streams == null) {
 74  0
             streams = new SavedStreams(new LowerCaseTokenizer(reader));
 75  0
             if (doStopWords && stopSet != null) {
 76  0
                 streams.setResult(new StopFilter(StopFilter.getEnablePositionIncrementsVersionDefault(matchVersion), streams.getResult(), stopSet));
 77  
             }
 78  
 
 79  0
             if (doStemming) {
 80  0
                 streams.setResult(new PorterStemFilter(streams.getResult()));
 81  
             }
 82  
 
 83  0
             setPreviousTokenStream(streams);
 84  
         } else {
 85  0
             streams.getSource().reset(reader);
 86  
         }
 87  0
         return streams.getResult();
 88  
     }
 89  
 
 90  0
     private final Version matchVersion = Version.LUCENE_29;
 91  
 }