public abstract class BinaryDictionary extends Object implements Dictionary
| Modifier and Type | Class and Description |
|---|---|
| static class | BinaryDictionary.ResourceScheme: Used to specify where (dictionary) resources get loaded from. |
| Modifier and Type | Field and Description |
|---|---|
| static String | DICT_FILENAME_SUFFIX |
| static String | DICT_HEADER |
| static int | HAS_BASEFORM: flag that the entry has baseform data. |
| static int | HAS_PRONUNCIATION: flag that the entry has pronunciation data. |
| static int | HAS_READING: flag that the entry has reading data. |
| static String | POSDICT_FILENAME_SUFFIX |
| static String | POSDICT_HEADER |
| static String | TARGETMAP_FILENAME_SUFFIX |
| static String | TARGETMAP_HEADER |
| static int | VERSION |
Fields inherited from interface Dictionary: INTERNAL_SEPARATOR

| Modifier | Constructor and Description |
|---|---|
| protected | BinaryDictionary() |
| protected | BinaryDictionary(BinaryDictionary.ResourceScheme resourceScheme, String resourcePath) |
| Modifier and Type | Method and Description |
|---|---|
| String | getBaseForm(int wordId, char[] surfaceForm, int off, int len): Get base form of word |
| static InputStream | getClassResource(Class<?> clazz, String suffix) |
| String | getInflectionForm(int wordId): Get inflection form of tokens |
| String | getInflectionType(int wordId): Get inflection type of tokens |
| int | getLeftId(int wordId): Get left id of specified word |
| String | getPartOfSpeech(int wordId): Get Part-Of-Speech of tokens |
| String | getPronunciation(int wordId, char[] surface, int off, int len): Get pronunciation of tokens |
| String | getReading(int wordId, char[] surface, int off, int len): Get reading of tokens |
| static InputStream | getResource(BinaryDictionary.ResourceScheme scheme, String path) |
| protected InputStream | getResource(String suffix) |
| int | getRightId(int wordId): Get right id of specified word |
| int | getWordCost(int wordId): Get word cost of specified word |
| void | lookupWordIds(int sourceId, IntsRef ref) |
public static final String DICT_FILENAME_SUFFIX
public static final String TARGETMAP_FILENAME_SUFFIX
public static final String POSDICT_FILENAME_SUFFIX
public static final String DICT_HEADER
public static final String TARGETMAP_HEADER
public static final String POSDICT_HEADER
public static final int VERSION
public static final int HAS_BASEFORM
public static final int HAS_READING
public static final int HAS_PRONUNCIATION
protected BinaryDictionary() throws IOException
Throws: IOException

protected BinaryDictionary(BinaryDictionary.ResourceScheme resourceScheme, String resourcePath) throws IOException
Parameters:
resourceScheme - scheme for loading resources (FILE or CLASSPATH).
resourcePath - where to load resources (dictionaries) from. If null, with CLASSPATH scheme only, use this class's name as the path.
Throws: IOException

protected final InputStream getResource(String suffix) throws IOException
Throws: IOException

public static final InputStream getResource(BinaryDictionary.ResourceScheme scheme, String path) throws IOException
Throws: IOException

public static final InputStream getClassResource(Class<?> clazz, String suffix) throws IOException
Throws: IOException

public void lookupWordIds(int sourceId, IntsRef ref)
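public int getLeftId(int wordId)
Description copied from interface: Dictionary
Get left id of specified word
Specified by: getLeftId in interface Dictionary

public int getRightId(int wordId)
Description copied from interface: Dictionary
Get right id of specified word
Specified by: getRightId in interface Dictionary

public int getWordCost(int wordId)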
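Description copied from interface: Dictionary
Get word cost of specified word
Specified by: getWordCost in interface Dictionary

public String getBaseForm(int wordId, char[] surfaceForm, int off, int len)
Description copied from interface: Dictionary
Get base form of word
Specified by: getBaseForm in interface Dictionary
Parameters: wordId - word ID of token

public String getReading(int wordId, char[] surface, int off, int len)
Description copied from interface: Dictionary
Get reading of tokens
Specified by: getReading in interface Dictionary
Parameters: wordId - word ID of token

public String getPartOfSpeech(int wordId)
Description copied from interface: Dictionary
Get Part-Of-Speech of tokens
Specified by: getPartOfSpeech in interface Dictionary
Parameters: wordId - word ID of token

public String getPronunciation(int wordId, char[] surface, int off, int len)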
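Description copied from interface: Dictionary
Get pronunciation of tokens
Specified by: getPronunciation in interface Dictionary
Parameters: wordId - word ID of token

public String getInflectionType(int wordId)
Description copied from interface: Dictionary
Get inflection type of tokens
Specified by: getInflectionType in interface Dictionary
Parameters: wordId - word ID of token

public String getInflectionForm(int wordId)
Description copied from interface: Dictionary
Get inflection form of tokens
Specified by: getInflectionForm in interface Dictionary
Parameters: wordId - word ID of token

Copyright © 2000-2021 Apache Software Foundation. All Rights Reserved.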