Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"arabicNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
ALEF |
1575 |
public static final char |
ALEF_HAMZA_ABOVE |
1571 |
public static final char |
ALEF_HAMZA_BELOW |
1573 |
public static final char |
ALEF_MADDA |
1570 |
public static final char |
DAMMA |
1615 |
public static final char |
DAMMATAN |
1612 |
public static final char |
DOTLESS_YEH |
1609 |
public static final char |
FATHA |
1614 |
public static final char |
FATHATAN |
1611 |
public static final char |
HEH |
1607 |
public static final char |
KASRA |
1616 |
public static final char |
KASRATAN |
1613 |
public static final char |
SHADDA |
1617 |
public static final char |
SUKUN |
1618 |
public static final char |
TATWEEL |
1600 |
public static final char |
TEH_MARBUTA |
1577 |
public static final char |
YEH |
1610 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"arabicStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
ALEF |
1575 |
public static final char |
BEH |
1576 |
public static final char |
FEH |
1601 |
public static final char |
HEH |
1607 |
public static final char |
KAF |
1603 |
public static final char |
LAM |
1604 |
public static final char |
NOON |
1606 |
public static final char |
TEH |
1578 |
public static final char |
TEH_MARBUTA |
1577 |
public static final char |
WAW |
1608 |
public static final char |
YEH |
1610 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"bulgarianStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"bengaliNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"bengaliStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"brazilianStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"htmlStrip" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"mapping" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DOUBLE_TYPE |
"<DOUBLE>" |
public static final int |
HAN |
1 |
public static final int |
HANGUL |
8 |
public static final int |
HIRAGANA |
2 |
public static final int |
KATAKANA |
4 |
public static final String |
SINGLE_TYPE |
"<SINGLE>" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"cjkBigram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"cjkWidth" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"soraniNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"soraniStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
GRAM_TYPE |
"gram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"commonGrams" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"commonGramsQuery" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_SUBWORD_SIZE |
15 |
public static final int |
DEFAULT_MIN_SUBWORD_SIZE |
2 |
public static final int |
DEFAULT_MIN_WORD_SIZE |
5 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"dictionaryCompoundWord" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hyphenationCompoundWord" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int |
BLOCK_SIZE |
2048 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"decimalDigit" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"flattenGraph" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_BUFFER_SIZE |
256 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"keyword" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"letter" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"lowercase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
FORMAT_SNOWBALL |
"snowball" |
public static final String |
FORMAT_WORDSET |
"wordset" |
public static final String |
NAME |
"stop" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"type" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"uppercase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"whitespace" |
public static final String |
RULE_JAVA |
"java" |
public static final String |
RULE_UNICODE |
"unicode" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"czechStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"danish_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"german_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"germanLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"germanMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"germanNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"germanStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"greekLowercase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"greekStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"englishMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"englishPossessive" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"kStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"porterStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"spanish_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"spanishLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"spanishMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
public static final String |
STOPWORDS_COMMENT |
"#" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"persian" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"persianNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
FARSI_YEH |
1740 |
public static final char |
HAMZA_ABOVE |
1620 |
public static final char |
HEH |
1607 |
public static final char |
HEH_GOAL |
1729 |
public static final char |
HEH_YEH |
1728 |
public static final char |
KAF |
1603 |
public static final char |
KEHEH |
1705 |
public static final char |
YEH |
1610 |
public static final char |
YEH_BARREE |
1746 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"finnish_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"finnishLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"french_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"frenchLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"frenchMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"irishLowercase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"galicianMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"galicianStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hindiNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hindiStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"hungarian_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hungarianLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hunspellStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"indonesianStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"indicNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"italian_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"italianLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"latvianStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_BUCKET_COUNT |
512 |
public static final int |
DEFAULT_HASH_COUNT |
1 |
public static final int |
DEFAULT_HASH_SET_SIZE |
1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"minHash" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"asciiFolding" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
2147483647 |
public static final int |
DEFAULT_MAX_WORD_COUNT |
2147483647 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
FORCE_FIRST_LETTER |
"forceFirstLetter" |
public static final String |
KEEP |
"keep" |
public static final String |
KEEP_IGNORE_CASE |
"keepIgnoreCase" |
public static final String |
MAX_TOKEN_LENGTH |
"maxTokenLength" |
public static final String |
MAX_WORD_COUNT |
"maxWordCount" |
public static final String |
MIN_WORD_LENGTH |
"minWordLength" |
public static final String |
NAME |
"capitalization" |
public static final String |
OK_PREFIX |
"okPrefix" |
public static final String |
ONLY_FIRST_WORD |
"onlyFirstWord" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
MAX_KEY |
"max" |
public static final String |
MIN_KEY |
"min" |
public static final String |
NAME |
"codepointCount" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_GRAPH_EXPANSIONS |
10000 |
public static final boolean |
DEFAULT_PRESERVE_POSITION_INCREMENTS |
true |
public static final boolean |
DEFAULT_PRESERVE_SEP |
true |
public static final int |
SEP_LABEL |
31 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"concatenateGraph" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"conditional" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DATE_TYPE |
"date" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DATE_PATTERN |
"datePattern" |
public static final String |
LOCALE |
"locale" |
public static final String |
NAME |
"dateRecognizer" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
DEFAULT_DELIMITER |
124 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DELIMITER_ATTR |
"delimiter" |
public static final String |
NAME |
"delimitedTermFrequency" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_OUTPUT_TOKEN_SIZE |
1024 |
public static final char |
DEFAULT_SEPARATOR |
32 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
MAX_OUTPUT_TOKEN_SIZE_KEY |
"maxOutputTokenSize" |
public static final String |
NAME |
"fingerprint" |
public static final String |
SEPARATOR_KEY |
"separator" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"fixBrokenOffsets" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"hyphenatedWords" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"keepWord" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"keywordMarker" |
public static final String |
PATTERN |
"pattern" |
public static final String |
PROTECTED_TOKENS |
"protected" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"keywordRepeat" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
MAX_KEY |
"max" |
public static final String |
MIN_KEY |
"min" |
public static final String |
NAME |
"length" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
CONSUME_ALL_TOKENS_KEY |
"consumeAllTokens" |
public static final String |
MAX_TOKEN_COUNT_KEY |
"maxTokenCount" |
public static final String |
NAME |
"limitTokenCount" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
CONSUME_ALL_TOKENS_KEY |
"consumeAllTokens" |
public static final String |
MAX_START_OFFSET |
"maxStartOffset" |
public static final String |
NAME |
"limitTokenOffset" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
CONSUME_ALL_TOKENS_KEY |
"consumeAllTokens" |
public static final String |
MAX_TOKEN_POSITION_KEY |
"maxTokenPosition" |
public static final String |
NAME |
"limitTokenPosition" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
FILTER_ARG_SEPARATOR |
46 |
public static final char |
FILTER_NAME_ID_SEPARATOR |
45 |
public static final String |
NAME |
"protectedTerm" |
public static final String |
PROTECTED_TERMS |
"protected" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"removeDuplicates" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"scandinavianFolding" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"scandinavianNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"stemmerOverride" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"trim" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"truncate" |
public static final String |
PREFIX_LENGTH_KEY |
"prefixLength" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"typeAsSynonym" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
ALPHA |
3 |
public static final int |
ALPHANUM |
7 |
public static final int |
CATENATE_ALL |
16 |
public static final int |
CATENATE_NUMBERS |
8 |
public static final int |
CATENATE_WORDS |
4 |
public static final int |
DIGIT |
4 |
public static final int |
GENERATE_NUMBER_PARTS |
2 |
public static final int |
GENERATE_WORD_PARTS |
1 |
public static final int |
IGNORE_KEYWORDS |
512 |
public static final int |
LOWER |
1 |
public static final int |
PRESERVE_ORIGINAL |
32 |
public static final int |
SPLIT_ON_CASE_CHANGE |
64 |
public static final int |
SPLIT_ON_NUMERICS |
128 |
public static final int |
STEM_ENGLISH_POSSESSIVE |
256 |
public static final int |
SUBWORD_DELIM |
8 |
public static final int |
UPPER |
2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"wordDelimiter" |
public static final String |
PROTECTED_TOKENS |
"protected" |
public static final String |
TYPES |
"types" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
CATENATE_ALL |
16 |
public static final int |
CATENATE_NUMBERS |
8 |
public static final int |
CATENATE_WORDS |
4 |
public static final int |
GENERATE_NUMBER_PARTS |
2 |
public static final int |
GENERATE_WORD_PARTS |
1 |
public static final int |
IGNORE_KEYWORDS |
512 |
public static final int |
PRESERVE_ORIGINAL |
32 |
public static final int |
SPLIT_ON_CASE_CHANGE |
64 |
public static final int |
SPLIT_ON_NUMERICS |
128 |
public static final int |
STEM_ENGLISH_POSSESSIVE |
256 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"wordDelimiterGraph" |
public static final String |
OFFSETS |
"adjustOffsets" |
public static final String |
PROTECTED_TOKENS |
"protected" |
public static final String |
TYPES |
"types" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
ALPHA |
3 |
public static final int |
ALPHANUM |
7 |
public static final int |
DONE |
-1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"edgeNGram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final boolean |
DEFAULT_PRESERVE_ORIGINAL |
false |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_GRAM_SIZE |
1 |
public static final int |
DEFAULT_MIN_GRAM_SIZE |
1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"edgeNGram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"nGram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final boolean |
DEFAULT_PRESERVE_ORIGINAL |
false |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_NGRAM_SIZE |
2 |
public static final int |
DEFAULT_MIN_NGRAM_SIZE |
1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"nGram" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"dutch_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"norwegian_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"norwegianLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
BOKMAAL |
1 |
public static final int |
NYNORSK |
2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"norwegianMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
DEFAULT_DELIMITER |
47 |
public static final int |
DEFAULT_SKIP |
0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"pathHierarchy" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
DEFAULT_DELIMITER |
47 |
public static final int |
DEFAULT_SKIP |
0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"patternCaptureGroup" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"patternReplace" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"patternReplace" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
GROUP |
"group" |
public static final String |
NAME |
"pattern" |
public static final String |
PATTERN |
"pattern" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"simplePatternSplit" |
public static final String |
PATTERN |
"pattern" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"simplePattern" |
public static final String |
PATTERN |
"pattern" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
DEFAULT_DELIMITER |
124 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DELIMITER_ATTR |
"delimiter" |
public static final String |
ENCODER_ATTR |
"encoder" |
public static final String |
NAME |
"delimitedPayload" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"numericPayload" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"tokenOffsetPayload" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"typeAsPayload" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"portuguese_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"portugueseLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"portugueseMinimalStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"portugueseStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final float |
defaultMaxDocFreqPercent |
0.4000000059604645f |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
INFORMATION_SEPARATOR_MARKER |
31 |
public static final char |
PUA_EC00_MARKER |
60416 |
public static final char |
RTL_DIRECTION_MARKER |
8207 |
public static final char |
START_OF_HEADING_MARKER |
1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"reverseString" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"russian_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"russianLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"fixedShingle" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_FILLER_TOKEN |
"_" |
public static final int |
DEFAULT_MAX_SHINGLE_SIZE |
2 |
public static final int |
DEFAULT_MIN_SHINGLE_SIZE |
2 |
public static final String |
DEFAULT_TOKEN_SEPARATOR |
" " |
public static final String |
DEFAULT_TOKEN_TYPE |
"shingle" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"shingle" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"snowballPorter" |
public static final String |
PROTECTED_TOKENS |
"protected" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"serbianNormalization" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
255 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"classic" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
ACRONYM |
2 |
public static final int |
ACRONYM_DEP |
8 |
public static final int |
ALPHANUM |
0 |
public static final int |
APOSTROPHE |
1 |
public static final int |
CJ |
7 |
public static final int |
COMPANY |
3 |
public static final int |
EMAIL |
4 |
public static final int |
HOST |
5 |
public static final int |
NUM |
6 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"classic" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"standard" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
255 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
ALPHANUM |
0 |
public static final int |
EMAIL |
8 |
public static final int |
EMOJI |
9 |
public static final int |
HANGUL |
6 |
public static final int |
HIRAGANA |
4 |
public static final int |
IDEOGRAPHIC |
3 |
public static final int |
KATAKANA |
5 |
public static final int |
MAX_TOKEN_LENGTH_LIMIT |
1048576 |
public static final int |
NUM |
1 |
public static final int |
SOUTHEAST_ASIAN |
2 |
public static final int |
URL |
7 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"uax29UrlEmail" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
AVOID_BAD_URL |
2 |
public static final int |
EMAIL_TYPE |
8 |
public static final int |
EMOJI_TYPE |
9 |
public static final int |
HANGUL_TYPE |
6 |
public static final int |
HIRAGANA_TYPE |
4 |
public static final int |
IDEOGRAPHIC_TYPE |
3 |
public static final int |
KATAKANA_TYPE |
5 |
public static final int |
NUMERIC_TYPE |
1 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
2 |
public static final int |
URL_TYPE |
7 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"swedish_stop.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"swedishLightStem" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
TYPE_SYNONYM |
"SYNONYM" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"synonym" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
TYPE_SYNONYM |
"SYNONYM" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"synonymGraph" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char |
WORD_SEPARATOR |
0 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"thai" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"apostrophe" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"turkishLowercase" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
LUCENE_MATCH_VERSION_PARAM |
"luceneMatchVersion" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
DEFAULT_MAX_WORD_LEN |
255 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"elision" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int |
BUFFERMAX |
1024 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
UNICODE_VERSION |
"11.0.0.0" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int |
ACRONYM_ID |
2 |
public static final int |
ALPHANUM_ID |
0 |
public static final int |
APOSTROPHE_ID |
1 |
public static final String |
BOLD |
"b" |
public static final int |
BOLD_ID |
12 |
public static final String |
BOLD_ITALICS |
"bi" |
public static final int |
BOLD_ITALICS_ID |
14 |
public static final int |
BOTH |
2 |
public static final String |
CATEGORY |
"c" |
public static final int |
CATEGORY_ID |
11 |
public static final String |
CITATION |
"ci" |
public static final int |
CITATION_ID |
10 |
public static final int |
CJ_ID |
7 |
public static final int |
COMPANY_ID |
3 |
public static final int |
EMAIL_ID |
4 |
public static final String |
EXTERNAL_LINK |
"el" |
public static final int |
EXTERNAL_LINK_ID |
9 |
public static final String |
EXTERNAL_LINK_URL |
"elu" |
public static final int |
EXTERNAL_LINK_URL_ID |
17 |
public static final String |
HEADING |
"h" |
public static final int |
HEADING_ID |
15 |
public static final int |
HOST_ID |
5 |
public static final String |
INTERNAL_LINK |
"il" |
public static final int |
INTERNAL_LINK_ID |
8 |
public static final String |
ITALICS |
"i" |
public static final int |
ITALICS_ID |
13 |
public static final int |
NUM_ID |
6 |
public static final String |
SUB_HEADING |
"sh" |
public static final int |
SUB_HEADING_ID |
16 |
public static final int |
TOKENS_ONLY |
0 |
public static final int |
UNTOKENIZED_ONLY |
1 |
public static final int |
UNTOKENIZED_TOKEN_FLAG |
1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final String |
NAME |
"wikipedia" |
public static final String |
TOKEN_OUTPUT |
"tokenOutput" |
public static final String |
UNTOKENIZED_TYPES |
"untokenizedTypes" |
Copyright © 2000-2019 Apache Software Foundation. All Rights Reserved.