public class CapitalizationFilterFactory extends BaseTokenFilterFactory
<fieldType name="text_cptlztn" class="solr.TextField" positionIncrementGap="100"> <analyzer> <tokenizer class="solr.WhitespaceTokenizerFactory"/> <filter class="solr.CapitalizationFilterFactory" onlyFirstWord="true" keep="java solr lucene" keepIgnoreCase="false" okPrefix="McK McD McA"/> </analyzer> </fieldType>
Modifier and Type | Field and Description |
---|---|
static int |
DEFAULT_MAX_WORD_COUNT |
static java.lang.String |
FORCE_FIRST_LETTER |
(package private) boolean |
forceFirstLetter |
(package private) org.apache.lucene.analysis.CharArraySet |
keep |
static java.lang.String |
KEEP |
static java.lang.String |
KEEP_IGNORE_CASE |
static java.lang.String |
MAX_TOKEN_LENGTH |
static java.lang.String |
MAX_WORD_COUNT |
(package private) int |
maxTokenLength |
(package private) int |
maxWordCount |
static java.lang.String |
MIN_WORD_LENGTH |
(package private) int |
minWordLength |
static java.lang.String |
OK_PREFIX |
(package private) java.util.Collection<char[]> |
okPrefix |
static java.lang.String |
ONLY_FIRST_WORD |
(package private) boolean |
onlyFirstWord |
log
args, luceneMatchVersion
Constructor and Description |
---|
CapitalizationFilterFactory() |
Modifier and Type | Method and Description |
---|---|
CapitalizationFilter |
create(org.apache.lucene.analysis.TokenStream input)
Transform the specified input TokenStream
|
void |
init(java.util.Map<java.lang.String,java.lang.String> args)
init will be called just once, immediately after creation. |
void |
processWord(char[] buffer,
int offset,
int length,
int wordCount) |
assureMatchVersion, getArgs, getBoolean, getBoolean, getInt, getInt, getInt, getSnowballWordSet, getWordSet, warnDeprecated
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait
getArgs
public static final int DEFAULT_MAX_WORD_COUNT
public static final java.lang.String KEEP
public static final java.lang.String KEEP_IGNORE_CASE
public static final java.lang.String OK_PREFIX
public static final java.lang.String MIN_WORD_LENGTH
public static final java.lang.String MAX_WORD_COUNT
public static final java.lang.String MAX_TOKEN_LENGTH
public static final java.lang.String ONLY_FIRST_WORD
public static final java.lang.String FORCE_FIRST_LETTER
org.apache.lucene.analysis.CharArraySet keep
java.util.Collection<char[]> okPrefix
int minWordLength
int maxWordCount
int maxTokenLength
boolean onlyFirstWord
boolean forceFirstLetter
public void init(java.util.Map<java.lang.String,java.lang.String> args)
Description copied from interface: TokenFilterFactory
init will be called just once, immediately after creation.
The args are user-level initialization parameters that may be specified when declaring the factory in the schema.xml.
Specified by: init in interface TokenFilterFactory
Overrides: init in class BaseTokenStreamFactory
public void processWord(char[] buffer, int offset, int length, int wordCount)
public CapitalizationFilter create(org.apache.lucene.analysis.TokenStream input)
TokenFilterFactory