public class MorphModel extends Model
| Modifier and Type | Class and Description |
|---|---|
static class |
MorphModel.MorphEntry |
BORDER_SYMBOL_, EMPTY_SYMBOL_
| Constructor and Description |
|---|
MorphModel() |
| Modifier and Type | Method and Description |
|---|---|
void |
addIndexes(Word word,
boolean insert) |
SymbolTable<java.lang.Character> |
getCharTable() |
RankerModel |
getLemmaModel() |
boolean |
getLemmaUseMorph() |
boolean |
getMarganlizeLemmas() |
int |
getMaxSignature() |
int |
getNumShapes() |
int |
getNumSubTags() |
static java.util.List<java.util.List<java.lang.Integer>> |
getOpenPosTagClassesCrossValidation(java.util.Collection<Sequence> sentences,
int num_folds,
java.util.List<SymbolTable<java.lang.String>> tag_tables) |
SymbolTable<java.lang.String> |
getShapeTable() |
int[] |
getTagCandidates(Sequence sequence,
int index,
State state) |
int[][][] |
getTagToSubTags() |
SymbolTable<java.lang.String> |
getTokenFeatureTable() |
SymbolTable<java.lang.String> |
getWeightedTokenFeatureTable() |
SymbolTable<java.lang.String> |
getWordTable() |
boolean |
hasBeenObserved(int form_index,
int level,
int tag_index) |
void |
init(MorphOptions options,
java.util.Collection<Sequence> sentences) |
boolean |
isOOV(int form_index) |
boolean |
isRare(int word) |
void |
setLemmaCandidates(State state,
boolean preprune) |
void |
setLemmaCandidates(Token token,
State state,
boolean preprune,
boolean training) |
void |
setVerbose(boolean verbose) |
static Tagger |
train(MorphOptions options,
java.util.Collection<Sequence> train_sentences,
java.util.Collection<Sequence> test_sentences) |
static Tagger |
train(MorphOptions options,
java.util.List<Sequence> train_sequences) |
static Tagger |
trainOptimal(MorphOptions options,
java.util.Collection<Sequence> train_sentences,
java.util.Collection<Sequence> test_sentences,
java.util.List<java.lang.String> parameters,
java.util.List<java.util.List<java.lang.String>> values_list,
java.util.List<MorphModel.MorphEntry> results) |
static Tagger |
trainOptimal(MorphOptions options,
java.util.Collection<Sequence> train_sentences,
java.util.Collection<Sequence> test_sentences,
java.lang.String parameter,
java.util.Collection<java.lang.String> values,
java.util.List<MorphModel.MorphEntry> results) |
static Tagger |
trainOptimal(MorphOptions options,
java.util.List<Sequence> train_sentences,
java.util.List<Sequence> test_sentences) |
getBoundaryIndex, getBoundaryState, getCategoryTable, getOptions, getOrder, getTagTables, init
public void init(MorphOptions options, java.util.Collection<Sequence> sentences)
public boolean hasBeenObserved(int form_index,
int level,
int tag_index)
public static java.util.List<java.util.List<java.lang.Integer>> getOpenPosTagClassesCrossValidation(java.util.Collection<Sequence> sentences, int num_folds, java.util.List<SymbolTable<java.lang.String>> tag_tables)
public void addIndexes(Word word, boolean insert)
public boolean isRare(int word)
public SymbolTable<java.lang.String> getWordTable()
public static Tagger trainOptimal(MorphOptions options, java.util.Collection<Sequence> train_sentences, java.util.Collection<Sequence> test_sentences, java.util.List<java.lang.String> parameters, java.util.List<java.util.List<java.lang.String>> values_list, java.util.List<MorphModel.MorphEntry> results)
public static Tagger trainOptimal(MorphOptions options, java.util.Collection<Sequence> train_sentences, java.util.Collection<Sequence> test_sentences, java.lang.String parameter, java.util.Collection<java.lang.String> values, java.util.List<MorphModel.MorphEntry> results)
public static Tagger trainOptimal(MorphOptions options, java.util.List<Sequence> train_sentences, java.util.List<Sequence> test_sentences)
public static Tagger train(MorphOptions options, java.util.Collection<Sequence> train_sentences, java.util.Collection<Sequence> test_sentences)
public SymbolTable<java.lang.Character> getCharTable()
public int getNumShapes()
public SymbolTable<java.lang.String> getShapeTable()
public boolean isOOV(int form_index)
public int getNumSubTags()
public SymbolTable<java.lang.String> getTokenFeatureTable()
public SymbolTable<java.lang.String> getWeightedTokenFeatureTable()
public int[] getTagCandidates(Sequence sequence, int index, State state)
getTagCandidates in class Model
public int[][][] getTagToSubTags()
public void setVerbose(boolean verbose)
public int getMaxSignature()
public static Tagger train(MorphOptions options, java.util.List<Sequence> train_sequences)
public void setLemmaCandidates(Token token, State state, boolean preprune, boolean training)
setLemmaCandidates in class Model
public void setLemmaCandidates(State state, boolean preprune)
setLemmaCandidates in class Model
public RankerModel getLemmaModel()
public boolean getMarganlizeLemmas()
getMarganlizeLemmas in class Model
public boolean getLemmaUseMorph()