Searched defs:stopwords (Results 1 - 25 of 38) sorted by relevance

12

/lucene-3.6.0/lucene/core/src/java/org/apache/lucene/analysis/
H A DStopAnalyzer.java37 * supplementary characters in stopwords
89 * @param stopwords Reader to load stop words from */
90 public StopAnalyzer(Version matchVersion, Reader stopwords) throws IOException { argument
91 this(matchVersion, WordlistLoader.getWordSet(stopwords, matchVersion));
108 source, stopwords));
H A DStopwordAnalyzerBase.java40 protected final CharArraySet stopwords; field in class:StopwordAnalyzerBase
46 * stopwords
49 * stopwords
52 return stopwords;
60 * @param stopwords
63 protected StopwordAnalyzerBase(final Version version, final Set<?> stopwords) { argument
65 // analyzers should use char array set for stopwords!
66 this.stopwords = stopwords == null ? CharArraySet.EMPTY_SET : CharArraySet
67 .unmodifiableSet(CharArraySet.copy(version, stopwords));
124 loadStopwordSet(File stopwords, Version matchVersion) argument
148 loadStopwordSet(Reader stopwords, Version matchVersion) argument
[all...]
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/cjk/
H A DCJKAnalyzer.java38 * and filters stopwords with {@link StopFilter}
90 * @param stopwords
93 public CJKAnalyzer(Version matchVersion, Set<?> stopwords){ argument
94 super(matchVersion, stopwords);
119 return new TokenStreamComponents(source, new StopFilter(matchVersion, result, stopwords));
122 return new TokenStreamComponents(source, new StopFilter(matchVersion, source, stopwords));
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/da/
H A DDanishAnalyzer.java46 /** File containing default Danish stopwords. */
87 * @param stopwords a stopword set
89 public DanishAnalyzer(Version matchVersion, Set<?> stopwords) { argument
90 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
99 * @param stopwords a stopword set
102 public DanishAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
103 super(matchVersion, stopwords);
126 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/el/
H A DGreekAnalyzer.java37 * Supports an external list of stopwords (words
39 * A default set of stopwords is used unless an alternative list is specified.
55 /** File containing default Greek stopwords. */
56 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
59 * Returns a set of default Greek-stopwords
60 * @return a set of default Greek-stopwords
92 * <b>NOTE:</b> The stopwords set should be pre-processed with the logic of
97 * @param stopwords a stopword set
99 public GreekAnalyzer(Version matchVersion, Set<?> stopwords) { argument
100 super(matchVersion, stopwords);
109 GreekAnalyzer(Version matchVersion, String... stopwords) argument
118 GreekAnalyzer(Version matchVersion, Map<?,?> stopwords) argument
[all...]
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/en/
H A DEnglishAnalyzer.java70 * @param stopwords a stopword set
72 public EnglishAnalyzer(Version matchVersion, Set<?> stopwords) { argument
73 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
82 * @param stopwords a stopword set
85 public EnglishAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
86 super(matchVersion, stopwords);
112 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/es/
H A DSpanishAnalyzer.java53 /** File containing default Spanish stopwords. */
94 * @param stopwords a stopword set
96 public SpanishAnalyzer(Version matchVersion, Set<?> stopwords) { argument
97 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
106 * @param stopwords a stopword set
109 public SpanishAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
110 super(matchVersion, stopwords);
133 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/eu/
H A DBasqueAnalyzer.java44 /** File containing default Basque stopwords. */
45 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
85 * @param stopwords a stopword set
87 public BasqueAnalyzer(Version matchVersion, Set<?> stopwords) { argument
88 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
97 * @param stopwords a stopword set
100 public BasqueAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
101 super(matchVersion, stopwords);
124 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/fi/
H A DFinnishAnalyzer.java46 /** File containing default Finnish stopwords. */
87 * @param stopwords a stopword set
89 public FinnishAnalyzer(Version matchVersion, Set<?> stopwords) { argument
90 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
99 * @param stopwords a stopword set
102 public FinnishAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
103 super(matchVersion, stopwords);
126 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/gl/
H A DGalicianAnalyzer.java44 /** File containing default Galician stopwords. */
45 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
85 * @param stopwords a stopword set
87 public GalicianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
88 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
97 * @param stopwords a stopword set
100 public GalicianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
101 super(matchVersion, stopwords);
124 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/hu/
H A DHungarianAnalyzer.java46 /** File containing default Hungarian stopwords. */
87 * @param stopwords a stopword set
89 public HungarianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
90 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
99 * @param stopwords a stopword set
102 public HungarianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
103 super(matchVersion, stopwords);
126 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/hy/
H A DArmenianAnalyzer.java44 /** File containing default Armenian stopwords. */
45 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
85 * @param stopwords a stopword set
87 public ArmenianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
88 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
97 * @param stopwords a stopword set
100 public ArmenianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
101 super(matchVersion, stopwords);
124 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/id/
H A DIndonesianAnalyzer.java39 /** File containing default Indonesian stopwords. */
40 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
82 * @param stopwords
85 public IndonesianAnalyzer(Version matchVersion, Set<?> stopwords){ argument
86 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
96 * @param stopwords
101 public IndonesianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet){ argument
102 super(matchVersion, stopwords);
124 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/lv/
H A DLatvianAnalyzer.java45 /** File containing default Latvian stopwords. */
46 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
86 * @param stopwords a stopword set
88 public LatvianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
89 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
98 * @param stopwords a stopword set
101 public LatvianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
102 super(matchVersion, stopwords);
125 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/no/
H A DNorwegianAnalyzer.java46 /** File containing default Norwegian stopwords. */
87 * @param stopwords a stopword set
89 public NorwegianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
90 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
99 * @param stopwords a stopword set
102 public NorwegianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
103 super(matchVersion, stopwords);
126 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/pt/
H A DPortugueseAnalyzer.java53 /** File containing default Portuguese stopwords. */
94 * @param stopwords a stopword set
96 public PortugueseAnalyzer(Version matchVersion, Set<?> stopwords) { argument
97 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
106 * @param stopwords a stopword set
109 public PortugueseAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
110 super(matchVersion, stopwords);
133 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/sv/
H A DSwedishAnalyzer.java46 /** File containing default Swedish stopwords. */
87 * @param stopwords a stopword set
89 public SwedishAnalyzer(Version matchVersion, Set<?> stopwords) { argument
90 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
99 * @param stopwords a stopword set
102 public SwedishAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
103 super(matchVersion, stopwords);
126 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/th/
H A DThaiAnalyzer.java41 * <li> As of 3.6, a set of Thai stopwords is used by default
46 /** File containing default Thai stopwords. */
47 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
49 * The comment character in the stopwords file.
94 * @param stopwords a stopword set
96 public ThaiAnalyzer(Version matchVersion, Set<?> stopwords) { argument
97 super(matchVersion, stopwords);
119 result, stopwords));
/lucene-3.6.0/lucene/core/src/java/org/apache/lucene/analysis/standard/
H A DClassicAnalyzer.java44 * supplementary characters in stopwords
94 * @param stopwords File to read stop words from
98 public ClassicAnalyzer(Version matchVersion, File stopwords) throws IOException { argument
99 this(matchVersion, WordlistLoader.getWordSet(IOUtils.getDecodingReader(stopwords,
107 * @param stopwords Reader to read stop words from */
108 public ClassicAnalyzer(Version matchVersion, Reader stopwords) throws IOException { argument
109 this(matchVersion, WordlistLoader.getWordSet(stopwords, matchVersion));
136 tok = new StopFilter(matchVersion, tok, stopwords);
H A DStandardAnalyzer.java43 * in stopwords. {@link ClassicTokenizer} and {@link ClassicAnalyzer}
90 * @param stopwords File to read stop words from
94 public StandardAnalyzer(Version matchVersion, File stopwords) throws IOException { argument
95 this(matchVersion, WordlistLoader.getWordSet(IOUtils.getDecodingReader(stopwords,
103 * @param stopwords Reader to read stop words from */
104 public StandardAnalyzer(Version matchVersion, Reader stopwords) throws IOException { argument
105 this(matchVersion, WordlistLoader.getWordSet(stopwords, matchVersion));
132 tok = new StopFilter(matchVersion, tok, stopwords);
H A DUAX29URLEmailAnalyzer.java72 * @param stopwords Reader to read stop words from */
73 public UAX29URLEmailAnalyzer(Version matchVersion, Reader stopwords) throws IOException { argument
74 this(matchVersion, WordlistLoader.getWordSet(stopwords, matchVersion));
100 tok = new StopFilter(matchVersion, tok, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/ar/
H A DArabicAnalyzer.java59 * File containing default Arabic stopwords.
64 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
67 * The comment character in the stopwords file. All lines prefixed with this will be ignored
114 * @param stopwords
117 public ArabicAnalyzer(Version matchVersion, Set<?> stopwords){ argument
118 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
128 * @param stopwords
133 public ArabicAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet){ argument
134 super(matchVersion, stopwords);
144 public ArabicAnalyzer( Version matchVersion, String... stopwords ) {
[all...]
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/bg/
H A DBulgarianAnalyzer.java49 * File containing default Bulgarian stopwords.
55 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
58 * The comment character in the stopwords file. All lines prefixed with this
106 public BulgarianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
107 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
115 public BulgarianAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
116 super(matchVersion, stopwords);
137 result = new StopFilter(matchVersion, result, stopwords);
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/br/
H A DBrazilianAnalyzer.java46 * Supports an external list of stopwords (words that
57 * List of typical Brazilian Portuguese stopwords.
82 /** File containing default Brazilian Portuguese stopwords. */
83 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
127 * @param stopwords
130 public BrazilianAnalyzer(Version matchVersion, Set<?> stopwords) { argument
131 super(matchVersion, stopwords);
139 * @param stopwords
142 public BrazilianAnalyzer(Version matchVersion, Set<?> stopwords, argument
144 this(matchVersion, stopwords);
154 BrazilianAnalyzer(Version matchVersion, String... stopwords) argument
163 BrazilianAnalyzer(Version matchVersion, Map<?,?> stopwords) argument
172 BrazilianAnalyzer(Version matchVersion, File stopwords) argument
[all...]
/lucene-3.6.0/lucene/contrib/analyzers/common/src/java/org/apache/lucene/analysis/ca/
H A DCatalanAnalyzer.java54 /** File containing default Catalan stopwords. */
55 public final static String DEFAULT_STOPWORD_FILE = "stopwords.txt";
101 * @param stopwords a stopword set
103 public CatalanAnalyzer(Version matchVersion, Set<?> stopwords) { argument
104 this(matchVersion, stopwords, CharArraySet.EMPTY_SET);
113 * @param stopwords a stopword set
116 public CatalanAnalyzer(Version matchVersion, Set<?> stopwords, Set<?> stemExclusionSet) { argument
117 super(matchVersion, stopwords);
143 result = new StopFilter(matchVersion, result, stopwords);

Completed in 39 milliseconds

12