public class WordDelimiterGraphFilterFactory extends TokenFilterFactory implements ResourceLoaderAware
Factory for WordDelimiterGraphFilter.
<fieldType name="text_wd" class="solr.TextField" positionIncrementGap="100">
  <analyzer>
    <tokenizer class="solr.WhitespaceTokenizerFactory"/>
    <filter class="solr.WordDelimiterGraphFilterFactory"
            protected="protectedword.txt"
            preserveOriginal="0"
            splitOnNumerics="1"
            splitOnCaseChange="1"
            catenateWords="0"
            catenateNumbers="0"
            catenateAll="0"
            generateWordParts="1"
            generateNumberParts="1"
            stemEnglishPossessive="1"
            types="wdfftypes.txt" />
  </analyzer>
</fieldType>
Modifier and Type | Field and Description |
---|---|
private boolean |
adjustOffsets |
private int |
flags |
static java.lang.String |
OFFSETS |
(package private) char[] |
out |
static java.lang.String |
PROTECTED_TOKENS |
private CharArraySet |
protectedWords |
private static java.util.regex.Pattern |
typePattern |
private java.lang.String |
types |
static java.lang.String |
TYPES |
(package private) byte[] |
typeTable |
private java.lang.String |
wordFiles |
Fields inherited from class AbstractAnalysisFactory: LUCENE_MATCH_VERSION_PARAM, luceneMatchVersion
Constructor and Description |
---|
WordDelimiterGraphFilterFactory(java.util.Map<java.lang.String,java.lang.String> args)
Creates a new WordDelimiterGraphFilterFactory
|
Modifier and Type | Method and Description |
---|---|
TokenFilter |
create(TokenStream input)
Transform the specified input TokenStream
|
void |
inform(ResourceLoader loader)
Initializes this component with the provided ResourceLoader
(used for loading classes, files, etc).
|
private java.lang.String |
parseString(java.lang.String s) |
private java.lang.Byte |
parseType(java.lang.String s) |
private byte[] |
parseTypes(java.util.List<java.lang.String> rules) |
Methods inherited from class TokenFilterFactory: availableTokenFilters, forName, lookupClass, normalize, reloadTokenFilters
Methods inherited from class AbstractAnalysisFactory: get, get, get, get, get, getBoolean, getChar, getClassArg, getFloat, getInt, getLines, getLuceneMatchVersion, getOriginalArgs, getPattern, getSet, getSnowballWordSet, getWordSet, isExplicitLuceneMatchVersion, require, require, require, requireBoolean, requireChar, requireFloat, requireInt, setExplicitLuceneMatchVersion, splitAt, splitFileNames
public static final java.lang.String PROTECTED_TOKENS
public static final java.lang.String TYPES
public static final java.lang.String OFFSETS
private final java.lang.String wordFiles
private final java.lang.String types
private final int flags
byte[] typeTable
private CharArraySet protectedWords
private boolean adjustOffsets
private static java.util.regex.Pattern typePattern
char[] out
public WordDelimiterGraphFilterFactory(java.util.Map<java.lang.String,java.lang.String> args)
public void inform(ResourceLoader loader) throws java.io.IOException
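Description copied from interface: ResourceLoaderAware
Initializes this component with the provided ResourceLoader (used for loading classes, files, etc).
Specified by: inform in interface ResourceLoaderAware
Throws: java.io.IOException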
public TokenFilter create(TokenStream input)
Description copied from class: TokenFilterFactory
Transform the specified input TokenStream
Specified by: create in class TokenFilterFactory
private byte[] parseTypes(java.util.List<java.lang.String> rules)
private java.lang.Byte parseType(java.lang.String s)
private java.lang.String parseString(java.lang.String s)