|
|||||||||
PREV NEXT | FRAMES NO FRAMES |
org.apache.* |
---|
org.apache.lucene.analysis.ar.ArabicAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.ar.ArabicNormalizer | ||
---|---|---|
public static final char |
ALEF |
1575 |
public static final char |
ALEF_HAMZA_ABOVE |
1571 |
public static final char |
ALEF_HAMZA_BELOW |
1573 |
public static final char |
ALEF_MADDA |
1570 |
public static final char |
DAMMA |
1615 |
public static final char |
DAMMATAN |
1612 |
public static final char |
DOTLESS_YEH |
1609 |
public static final char |
FATHA |
1614 |
public static final char |
FATHATAN |
1611 |
public static final char |
HEH |
1607 |
public static final char |
KASRA |
1616 |
public static final char |
KASRATAN |
1613 |
public static final char |
SHADDA |
1617 |
public static final char |
SUKUN |
1618 |
public static final char |
TATWEEL |
1600 |
public static final char |
TEH_MARBUTA |
1577 |
public static final char |
YEH |
1610 |
org.apache.lucene.analysis.ar.ArabicStemmer | ||
---|---|---|
public static final char |
ALEF |
1575 |
public static final char |
BEH |
1576 |
public static final char |
FEH |
1601 |
public static final char |
HEH |
1607 |
public static final char |
KAF |
1603 |
public static final char |
LAM |
1604 |
public static final char |
NOON |
1606 |
public static final char |
TEH |
1578 |
public static final char |
TEH_MARBUTA |
1577 |
public static final char |
WAW |
1608 |
public static final char |
YEH |
1610 |
org.apache.lucene.analysis.bg.BulgarianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.br.BrazilianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.ca.CatalanAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.cjk.CJKAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.cjk.CJKBigramFilter | ||
---|---|---|
public static final String |
DOUBLE_TYPE |
"<DOUBLE>" |
public static final int |
HAN |
1 |
public static final int |
HANGUL |
8 |
public static final int |
HIRAGANA |
2 |
public static final int |
KATAKANA |
4 |
public static final String |
SINGLE_TYPE |
"<SINGLE>" |
org.apache.lucene.analysis.commongrams.CommonGramsFilter | ||
---|---|---|
public static final String |
GRAM_TYPE |
"gram" |
org.apache.lucene.analysis.compound.CompoundWordTokenFilterBase | ||
---|---|---|
public static final int |
DEFAULT_MAX_SUBWORD_SIZE |
15 |
public static final int |
DEFAULT_MIN_SUBWORD_SIZE |
2 |
public static final int |
DEFAULT_MIN_WORD_SIZE |
5 |
org.apache.lucene.analysis.compound.hyphenation.TernaryTree | ||
---|---|---|
protected static final int |
BLOCK_SIZE |
2048 |
org.apache.lucene.analysis.core.KeywordTokenizer | ||
---|---|---|
public static final int |
DEFAULT_BUFFER_SIZE |
256 |
org.apache.lucene.analysis.cz.CzechAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.da.DanishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"danish_stop.txt" |
org.apache.lucene.analysis.de.GermanAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"german_stop.txt" |
org.apache.lucene.analysis.el.GreekAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.es.SpanishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"spanish_stop.txt" |
org.apache.lucene.analysis.eu.BasqueAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.fa.PersianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
public static final String |
STOPWORDS_COMMENT |
"#" |
org.apache.lucene.analysis.fa.PersianNormalizer | ||
---|---|---|
public static final char |
FARSI_YEH |
1740 |
public static final char |
HAMZA_ABOVE |
1620 |
public static final char |
HEH |
1607 |
public static final char |
HEH_GOAL |
1729 |
public static final char |
HEH_YEH |
1728 |
public static final char |
KAF |
1603 |
public static final char |
KEHEH |
1705 |
public static final char |
YEH |
1610 |
public static final char |
YEH_BARREE |
1746 |
org.apache.lucene.analysis.fi.FinnishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"finnish_stop.txt" |
org.apache.lucene.analysis.fr.FrenchAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"french_stop.txt" |
org.apache.lucene.analysis.ga.IrishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.gl.GalicianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.hi.HindiAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.hu.HungarianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"hungarian_stop.txt" |
org.apache.lucene.analysis.hy.ArmenianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.id.IndonesianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.it.ItalianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"italian_stop.txt" |
org.apache.lucene.analysis.lv.LatvianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.miscellaneous.CapitalizationFilter | ||
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
2147483647 |
public static final int |
DEFAULT_MAX_WORD_COUNT |
2147483647 |
org.apache.lucene.analysis.miscellaneous.CapitalizationFilterFactory | ||
---|---|---|
public static final String |
FORCE_FIRST_LETTER |
"forceFirstLetter" |
public static final String |
KEEP |
"keep" |
public static final String |
KEEP_IGNORE_CASE |
"keepIgnoreCase" |
public static final String |
MAX_TOKEN_LENGTH |
"maxTokenLength" |
public static final String |
MAX_WORD_COUNT |
"maxWordCount" |
public static final String |
MIN_WORD_LENGTH |
"minWordLength" |
public static final String |
OK_PREFIX |
"okPrefix" |
public static final String |
ONLY_FIRST_WORD |
"onlyFirstWord" |
org.apache.lucene.analysis.miscellaneous.KeywordMarkerFilterFactory | ||
---|---|---|
public static final String |
PROTECTED_TOKENS |
"protected" |
org.apache.lucene.analysis.miscellaneous.LengthFilterFactory | ||
---|---|---|
public static final String |
MAX_KEY |
"max" |
public static final String |
MIN_KEY |
"min" |
org.apache.lucene.analysis.miscellaneous.LimitTokenCountFilterFactory | ||
---|---|---|
public static final String |
CONSUME_ALL_TOKENS_KEY |
"consumeAllTokens" |
public static final String |
MAX_TOKEN_COUNT_KEY |
"maxTokenCount" |
org.apache.lucene.analysis.miscellaneous.WordDelimiterFilter | ||
---|---|---|
public static final int |
ALPHA |
3 |
public static final int |
ALPHANUM |
7 |
public static final int |
CATENATE_ALL |
16 |
public static final int |
CATENATE_NUMBERS |
8 |
public static final int |
CATENATE_WORDS |
4 |
public static final int |
DIGIT |
4 |
public static final int |
GENERATE_NUMBER_PARTS |
2 |
public static final int |
GENERATE_WORD_PARTS |
1 |
public static final int |
LOWER |
1 |
public static final int |
PRESERVE_ORIGINAL |
32 |
public static final int |
SPLIT_ON_CASE_CHANGE |
64 |
public static final int |
SPLIT_ON_NUMERICS |
128 |
public static final int |
STEM_ENGLISH_POSSESSIVE |
256 |
public static final int |
SUBWORD_DELIM |
8 |
public static final int |
UPPER |
2 |
org.apache.lucene.analysis.miscellaneous.WordDelimiterFilterFactory | ||
---|---|---|
public static final String |
PROTECTED_TOKENS |
"protected" |
public static final String |
TYPES |
"types" |
org.apache.lucene.analysis.miscellaneous.WordDelimiterIterator | ||
---|---|---|
public static final int |
DONE |
-1 |
org.apache.lucene.analysis.ngram.EdgeNGramTokenFilter | ||
---|---|---|
public static final int |
DEFAULT_MAX_GRAM_SIZE |
1 |
public static final int |
DEFAULT_MIN_GRAM_SIZE |
1 |
org.apache.lucene.analysis.ngram.EdgeNGramTokenizer | ||
---|---|---|
public static final int |
DEFAULT_MAX_GRAM_SIZE |
1 |
public static final int |
DEFAULT_MIN_GRAM_SIZE |
1 |
org.apache.lucene.analysis.ngram.NGramTokenFilter | ||
---|---|---|
public static final int |
DEFAULT_MAX_NGRAM_SIZE |
2 |
public static final int |
DEFAULT_MIN_NGRAM_SIZE |
1 |
org.apache.lucene.analysis.ngram.NGramTokenizer | ||
---|---|---|
public static final int |
DEFAULT_MAX_NGRAM_SIZE |
2 |
public static final int |
DEFAULT_MIN_NGRAM_SIZE |
1 |
org.apache.lucene.analysis.nl.DutchAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"dutch_stop.txt" |
org.apache.lucene.analysis.no.NorwegianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"norwegian_stop.txt" |
org.apache.lucene.analysis.path.PathHierarchyTokenizer | ||
---|---|---|
public static final char |
DEFAULT_DELIMITER |
47 |
public static final int |
DEFAULT_SKIP |
0 |
org.apache.lucene.analysis.path.ReversePathHierarchyTokenizer | ||
---|---|---|
public static final char |
DEFAULT_DELIMITER |
47 |
public static final int |
DEFAULT_SKIP |
0 |
org.apache.lucene.analysis.pattern.PatternReplaceCharFilter | ||
---|---|---|
public static final int |
DEFAULT_MAX_BLOCK_CHARS |
10000 |
org.apache.lucene.analysis.pattern.PatternTokenizerFactory | ||
---|---|---|
public static final String |
GROUP |
"group" |
public static final String |
PATTERN |
"pattern" |
org.apache.lucene.analysis.payloads.DelimitedPayloadTokenFilter | ||
---|---|---|
public static final char |
DEFAULT_DELIMITER |
124 |
org.apache.lucene.analysis.payloads.DelimitedPayloadTokenFilterFactory | ||
---|---|---|
public static final String |
DELIMITER_ATTR |
"delimiter" |
public static final String |
ENCODER_ATTR |
"encoder" |
org.apache.lucene.analysis.pt.PortugueseAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"portuguese_stop.txt" |
org.apache.lucene.analysis.query.QueryAutoStopWordAnalyzer | ||
---|---|---|
public static final float |
defaultMaxDocFreqPercent |
0.4000000059604645f |
org.apache.lucene.analysis.reverse.ReverseStringFilter | ||
---|---|---|
public static final char |
INFORMATION_SEPARATOR_MARKER |
31 |
public static final char |
PUA_EC00_MARKER |
60416 |
public static final char |
RTL_DIRECTION_MARKER |
8207 |
public static final char |
START_OF_HEADING_MARKER |
1 |
org.apache.lucene.analysis.ro.RomanianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.ru.RussianAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"russian_stop.txt" |
org.apache.lucene.analysis.shingle.ShingleFilter | ||
---|---|---|
public static final int |
DEFAULT_MAX_SHINGLE_SIZE |
2 |
public static final int |
DEFAULT_MIN_SHINGLE_SIZE |
2 |
public static final String |
DEFAULT_TOKEN_TYPE |
"shingle" |
public static final String |
TOKEN_SEPARATOR |
" " |
org.apache.lucene.analysis.sinks.DateRecognizerSinkFilter | ||
---|---|---|
public static final String |
DATE_TYPE |
"date" |
org.apache.lucene.analysis.snowball.SnowballPorterFilterFactory | ||
---|---|---|
public static final String |
PROTECTED_TOKENS |
"protected" |
org.apache.lucene.analysis.standard.ClassicAnalyzer | ||
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
255 |
org.apache.lucene.analysis.standard.ClassicTokenizer | ||
---|---|---|
public static final int |
ACRONYM |
2 |
public static final int |
ACRONYM_DEP |
8 |
public static final int |
ALPHANUM |
0 |
public static final int |
APOSTROPHE |
1 |
public static final int |
CJ |
7 |
public static final int |
COMPANY |
3 |
public static final int |
EMAIL |
4 |
public static final int |
HOST |
5 |
public static final int |
NUM |
6 |
org.apache.lucene.analysis.standard.StandardAnalyzer | ||
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
255 |
org.apache.lucene.analysis.standard.StandardTokenizer | ||
---|---|---|
public static final int |
ACRONYM |
2 |
public static final int |
ACRONYM_DEP |
8 |
public static final int |
ALPHANUM |
0 |
public static final int |
APOSTROPHE |
1 |
public static final int |
CJ |
7 |
public static final int |
COMPANY |
3 |
public static final int |
EMAIL |
4 |
public static final int |
HANGUL |
13 |
public static final int |
HIRAGANA |
11 |
public static final int |
HOST |
5 |
public static final int |
IDEOGRAPHIC |
10 |
public static final int |
KATAKANA |
12 |
public static final int |
NUM |
6 |
public static final int |
SOUTHEAST_ASIAN |
9 |
org.apache.lucene.analysis.standard.StandardTokenizerImpl | ||
---|---|---|
public static final int |
HANGUL_TYPE |
13 |
public static final int |
HIRAGANA_TYPE |
11 |
public static final int |
IDEOGRAPHIC_TYPE |
10 |
public static final int |
KATAKANA_TYPE |
12 |
public static final int |
NUMERIC_TYPE |
6 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
9 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.StandardTokenizerInterface | ||
---|---|---|
public static final int |
YYEOF |
-1 |
org.apache.lucene.analysis.standard.UAX29URLEmailAnalyzer | ||
---|---|---|
public static final int |
DEFAULT_MAX_TOKEN_LENGTH |
255 |
org.apache.lucene.analysis.standard.UAX29URLEmailTokenizer | ||
---|---|---|
public static final int |
ALPHANUM |
0 |
public static final int |
EMAIL |
8 |
public static final int |
HANGUL |
6 |
public static final int |
HIRAGANA |
4 |
public static final int |
IDEOGRAPHIC |
3 |
public static final int |
KATAKANA |
5 |
public static final int |
NUM |
1 |
public static final int |
SOUTHEAST_ASIAN |
2 |
public static final int |
URL |
7 |
org.apache.lucene.analysis.standard.UAX29URLEmailTokenizerImpl | ||
---|---|---|
public static final int |
EMAIL_TYPE |
8 |
public static final int |
HANGUL_TYPE |
6 |
public static final int |
HIRAGANA_TYPE |
4 |
public static final int |
IDEOGRAPHIC_TYPE |
3 |
public static final int |
KATAKANA_TYPE |
5 |
public static final int |
NUMERIC_TYPE |
1 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
2 |
public static final int |
URL_TYPE |
7 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.std31.StandardTokenizerImpl31 | ||
---|---|---|
public static final int |
HANGUL_TYPE |
13 |
public static final int |
HIRAGANA_TYPE |
11 |
public static final int |
IDEOGRAPHIC_TYPE |
10 |
public static final int |
KATAKANA_TYPE |
12 |
public static final int |
NUMERIC_TYPE |
6 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
9 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.std31.UAX29URLEmailTokenizerImpl31 | ||
---|---|---|
public static final int |
EMAIL_TYPE |
8 |
public static final int |
HANGUL_TYPE |
6 |
public static final int |
HIRAGANA_TYPE |
4 |
public static final int |
IDEOGRAPHIC_TYPE |
3 |
public static final int |
KATAKANA_TYPE |
5 |
public static final int |
NUMERIC_TYPE |
1 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
2 |
public static final int |
URL_TYPE |
7 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.std34.StandardTokenizerImpl34 | ||
---|---|---|
public static final int |
HANGUL_TYPE |
13 |
public static final int |
HIRAGANA_TYPE |
11 |
public static final int |
IDEOGRAPHIC_TYPE |
10 |
public static final int |
KATAKANA_TYPE |
12 |
public static final int |
NUMERIC_TYPE |
6 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
9 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.std34.UAX29URLEmailTokenizerImpl34 | ||
---|---|---|
public static final int |
EMAIL_TYPE |
8 |
public static final int |
HANGUL_TYPE |
6 |
public static final int |
HIRAGANA_TYPE |
4 |
public static final int |
IDEOGRAPHIC_TYPE |
3 |
public static final int |
KATAKANA_TYPE |
5 |
public static final int |
NUMERIC_TYPE |
1 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
2 |
public static final int |
URL_TYPE |
7 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.standard.std36.UAX29URLEmailTokenizerImpl36 | ||
---|---|---|
public static final int |
EMAIL_TYPE |
8 |
public static final int |
HANGUL_TYPE |
6 |
public static final int |
HIRAGANA_TYPE |
4 |
public static final int |
IDEOGRAPHIC_TYPE |
3 |
public static final int |
KATAKANA_TYPE |
5 |
public static final int |
NUMERIC_TYPE |
1 |
public static final int |
SOUTH_EAST_ASIAN_TYPE |
2 |
public static final int |
URL_TYPE |
7 |
public static final int |
WORD_TYPE |
0 |
public static final int |
YYEOF |
-1 |
public static final int |
YYINITIAL |
0 |
org.apache.lucene.analysis.sv.SwedishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"swedish_stop.txt" |
org.apache.lucene.analysis.synonym.SynonymFilter | ||
---|---|---|
public static final String |
TYPE_SYNONYM |
"SYNONYM" |
org.apache.lucene.analysis.synonym.SynonymMap | ||
---|---|---|
public static final char |
WORD_SEPARATOR |
0 |
org.apache.lucene.analysis.th.ThaiAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.tr.TurkishAnalyzer | ||
---|---|---|
public static final String |
DEFAULT_STOPWORD_FILE |
"stopwords.txt" |
org.apache.lucene.analysis.wikipedia.WikipediaTokenizer | ||
---|---|---|
public static final int |
ACRONYM_ID |
2 |
public static final int |
ALPHANUM_ID |
0 |
public static final int |
APOSTROPHE_ID |
1 |
public static final String |
BOLD |
"b" |
public static final int |
BOLD_ID |
12 |
public static final String |
BOLD_ITALICS |
"bi" |
public static final int |
BOLD_ITALICS_ID |
14 |
public static final int |
BOTH |
2 |
public static final String |
CATEGORY |
"c" |
public static final int |
CATEGORY_ID |
11 |
public static final String |
CITATION |
"ci" |
public static final int |
CITATION_ID |
10 |
public static final int |
CJ_ID |
7 |
public static final int |
COMPANY_ID |
3 |
public static final int |
EMAIL_ID |
4 |
public static final String |
EXTERNAL_LINK |
"el" |
public static final int |
EXTERNAL_LINK_ID |
9 |
public static final String |
EXTERNAL_LINK_URL |
"elu" |
public static final int |
EXTERNAL_LINK_URL_ID |
17 |
public static final String |
HEADING |
"h" |
public static final int |
HEADING_ID |
15 |
public static final int |
HOST_ID |
5 |
public static final String |
INTERNAL_LINK |
"il" |
public static final int |
INTERNAL_LINK_ID |
8 |
public static final String |
ITALICS |
"i" |
public static final int |
ITALICS_ID |
13 |
public static final int |
NUM_ID |
6 |
public static final String |
SUB_HEADING |
"sh" |
public static final int |
SUB_HEADING_ID |
16 |
public static final int |
TOKENS_ONLY |
0 |
public static final int |
UNTOKENIZED_ONLY |
1 |
public static final int |
UNTOKENIZED_TOKEN_FLAG |
1 |
|
|||||||||
PREV NEXT | FRAMES NO FRAMES |