Property | Type | Description | |
---|---|---|---|
DEFAULT_ANALYZER | |||
EXTENDED_ANALYZER | |||
NON_WORD_PATTERN | Pattern | ||
WHITESPACE_PATTERN | Pattern |
Method | Description | |
---|---|---|
Equals ( object other ) : bool |
Indicates whether some other object is "equal to" this one.
|
|
GetHashCode ( ) : int |
Returns a hash code value for the object.
|
|
PatternAnalyzer ( System.Version matchVersion, Pattern pattern, bool toLowerCase, CharArraySet stopWords ) : System |
Constructs a new instance with the given parameters.
|
|
createComponents ( string fieldName, Reader reader ) : TokenStreamComponents |
Creates a token stream that tokenizes all the text in the given Reader. This implementation forwards to createComponents ( string fieldName, Reader reader, string text ).
|
|
createComponents ( string fieldName, Reader reader, string text ) : TokenStreamComponents |
Creates a token stream that tokenizes the given string into token terms (aka words).
|
Method | Description | |
---|---|---|
ToString ( Reader input ) : string |
Reads until end-of-stream and returns all read chars, finally closes the stream.
|
|
eq ( object o1, object o2 ) : bool |
equality where o1 and/or o2 can be null
|
|
eqPattern ( Pattern p1, Pattern p2 ) : bool |
assumes p1 and p2 are not null
|
public Equals ( object other ) : bool | ||
other | object | the reference object with which to compare. |
return | bool |
public PatternAnalyzer ( System.Version matchVersion, Pattern pattern, bool toLowerCase, CharArraySet stopWords ) : System | ||
matchVersion | System.Version | currently does nothing |
pattern | Pattern | a regular expression delimiting tokens |
toLowerCase | bool |
if true, returns tokens after applying
String.toLowerCase() |
stopWords | CharArraySet |
if non-null, ignores all tokens that are contained in the
given stop set (after previously having applied toLowerCase()
if applicable). For example, created via
WordlistLoader.getWordSet(new File("samples/fulltext/stopwords.txt"))
or other stop words
lists. |
return | System |
public createComponents ( string fieldName, Reader reader ) : TokenStreamComponents | ||
fieldName | string | the name of the field to tokenize (currently ignored). |
reader | Reader | the reader delivering the text |
return | TokenStreamComponents |
public createComponents ( string fieldName, Reader reader, string text ) : TokenStreamComponents | ||
fieldName | string | the name of the field to tokenize (currently ignored). |
reader | Reader | reader (e.g. charfilter) of the original text. Can be null. |
text | string | the string to tokenize |
return | TokenStreamComponents |
public static PatternAnalyzer,org.apache.lucene.analysis.miscellaneous DEFAULT_ANALYZER | ||
return |
public static PatternAnalyzer,org.apache.lucene.analysis.miscellaneous EXTENDED_ANALYZER | ||
return |