public class WordDelimiterGraphFilterFactory extends TokenFilterFactory implements ResourceLoaderAware
Factory for WordDelimiterGraphFilter.
<fieldType name="text_wd" class="solr.TextField" positionIncrementGap="100">
  <analyzer>
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.WordDelimiterGraphFilterFactory" protected="protectedword.txt"
            preserveOriginal="0" splitOnNumerics="1" splitOnCaseChange="1"
            catenateWords="0" catenateNumbers="0" catenateAll="0"
            generateWordParts="1" generateNumberParts="1" stemEnglishPossessive="1"
            types="wdfftypes.txt" />
  </analyzer>
</fieldType>
Modifier and Type | Field and Description |
---|---|
private int | flags |
(package private) char[] | out |
static java.lang.String | PROTECTED_TOKENS |
private CharArraySet | protectedWords |
private static java.util.regex.Pattern | typePattern |
private java.lang.String | types |
static java.lang.String | TYPES |
(package private) byte[] | typeTable |
private java.lang.String | wordFiles |
Fields inherited from class AbstractAnalysisFactory: LUCENE_MATCH_VERSION_PARAM, luceneMatchVersion
Constructor and Description |
---|
WordDelimiterGraphFilterFactory(java.util.Map<java.lang.String,java.lang.String> args) — Creates a new WordDelimiterGraphFilterFactory. |
Modifier and Type | Method and Description |
---|---|
TokenFilter | create(TokenStream input) — Transform the specified input TokenStream. |
void | inform(ResourceLoader loader) — Initializes this component with the provided ResourceLoader (used for loading classes, files, etc). |
private java.lang.String | parseString(java.lang.String s) |
private java.lang.Byte | parseType(java.lang.String s) |
private byte[] | parseTypes(java.util.List<java.lang.String> rules) |
Methods inherited from class TokenFilterFactory: availableTokenFilters, forName, lookupClass, reloadTokenFilters
Methods inherited from class AbstractAnalysisFactory: get, get, get, get, get, getBoolean, getChar, getClassArg, getFloat, getInt, getLines, getLuceneMatchVersion, getOriginalArgs, getPattern, getSet, getSnowballWordSet, getWordSet, isExplicitLuceneMatchVersion, require, require, require, requireBoolean, requireChar, requireFloat, requireInt, setExplicitLuceneMatchVersion, splitFileNames
public static final java.lang.String PROTECTED_TOKENS
public static final java.lang.String TYPES
private final java.lang.String wordFiles
private final java.lang.String types
private final int flags
byte[] typeTable
private CharArraySet protectedWords
private static java.util.regex.Pattern typePattern
char[] out
public WordDelimiterGraphFilterFactory(java.util.Map<java.lang.String,java.lang.String> args)
public void inform(ResourceLoader loader) throws java.io.IOException
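Description copied from interface: ResourceLoaderAware
Initializes this component with the provided ResourceLoader (used for loading classes, files, etc).
Specified by: inform in interface ResourceLoaderAware
Throws: java.io.IOException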
public TokenFilter create(TokenStream input)
Description copied from class: TokenFilterFactory
Transform the specified input TokenStream.
Specified by: create in class TokenFilterFactory
private byte[] parseTypes(java.util.List<java.lang.String> rules)
private java.lang.Byte parseType(java.lang.String s)
private java.lang.String parseString(java.lang.String s)