public abstract class BinaryDictionary extends java.lang.Object implements Dictionary
Modifier and Type | Field and Description |
---|---|
static java.lang.String | DICT_FILENAME_SUFFIX |
static java.lang.String | DICT_HEADER |
static int | HAS_BASEFORM — flag that the entry has baseform data. |
static int | HAS_PRONUNCIATION — flag that the entry has pronunciation data. |
static int | HAS_READING — flag that the entry has reading data. |
static java.lang.String | POSDICT_FILENAME_SUFFIX |
static java.lang.String | POSDICT_HEADER |
static java.lang.String | TARGETMAP_FILENAME_SUFFIX |
static java.lang.String | TARGETMAP_HEADER |
static int | VERSION |
Fields inherited from interface Dictionary: INTERNAL_SEPARATOR
Modifier | Constructor and Description |
---|---|
protected | BinaryDictionary() |
Modifier and Type | Method and Description |
---|---|
java.lang.String | getBaseForm(int wordId, char[] surfaceForm, int off, int len) — Get base form of word |
static java.io.InputStream | getClassResource(java.lang.Class<?> clazz, java.lang.String suffix) |
java.lang.String | getInflectionForm(int wordId) — Get inflection form of tokens |
java.lang.String | getInflectionType(int wordId) — Get inflection type of tokens |
int | getLeftId(int wordId) — Get left id of specified word |
java.lang.String | getPartOfSpeech(int wordId) — Get Part-Of-Speech of tokens |
java.lang.String | getPronunciation(int wordId, char[] surface, int off, int len) — Get pronunciation of tokens |
java.lang.String | getReading(int wordId, char[] surface, int off, int len) — Get reading of tokens |
protected java.io.InputStream | getResource(java.lang.String suffix) |
int | getRightId(int wordId) — Get right id of specified word |
int | getWordCost(int wordId) — Get word cost of specified word |
void | lookupWordIds(int sourceId, IntsRef ref) |
public static final java.lang.String DICT_FILENAME_SUFFIX
public static final java.lang.String TARGETMAP_FILENAME_SUFFIX
public static final java.lang.String POSDICT_FILENAME_SUFFIX
public static final java.lang.String DICT_HEADER
public static final java.lang.String TARGETMAP_HEADER
public static final java.lang.String POSDICT_HEADER
public static final int VERSION
public static final int HAS_BASEFORM
public static final int HAS_READING
public static final int HAS_PRONUNCIATION
protected BinaryDictionary() throws java.io.IOException
Throws: java.io.IOException
protected final java.io.InputStream getResource(java.lang.String suffix) throws java.io.IOException
Throws: java.io.IOException
public static final java.io.InputStream getClassResource(java.lang.Class<?> clazz, java.lang.String suffix) throws java.io.IOException
Throws: java.io.IOException
public void lookupWordIds(int sourceId, IntsRef ref)
public int getLeftId(int wordId)
Description copied from interface: Dictionary
Get left id of specified word
Specified by: getLeftId in interface Dictionary
public int getRightId(int wordId)
Description copied from interface: Dictionary
Get right id of specified word
Specified by: getRightId in interface Dictionary
public int getWordCost(int wordId)
Description copied from interface: Dictionary
Get word cost of specified word
Specified by: getWordCost in interface Dictionary
public java.lang.String getBaseForm(int wordId, char[] surfaceForm, int off, int len)
Description copied from interface: Dictionary
Get base form of word
Specified by: getBaseForm in interface Dictionary
Parameters: wordId - word ID of token
public java.lang.String getReading(int wordId, char[] surface, int off, int len)
Description copied from interface: Dictionary
Get reading of tokens
Specified by: getReading in interface Dictionary
Parameters: wordId - word ID of token
public java.lang.String getPartOfSpeech(int wordId)
Description copied from interface: Dictionary
Get Part-Of-Speech of tokens
Specified by: getPartOfSpeech in interface Dictionary
Parameters: wordId - word ID of token
public java.lang.String getPronunciation(int wordId, char[] surface, int off, int len)
Description copied from interface: Dictionary
Get pronunciation of tokens
Specified by: getPronunciation in interface Dictionary
Parameters: wordId - word ID of token
public java.lang.String getInflectionType(int wordId)
Description copied from interface: Dictionary
Get inflection type of tokens
Specified by: getInflectionType in interface Dictionary
Parameters: wordId - word ID of token
public java.lang.String getInflectionForm(int wordId)
Description copied from interface: Dictionary
Get inflection form of tokens
Specified by: getInflectionForm in interface Dictionary
Parameters: wordId - word ID of token
Copyright © 2000–2019 The Apache Software Foundation. All rights reserved.