public class MergeBrillLexicon
extends java.lang.Object
Modifier and Type | Field and Description |
---|---|
protected static java.lang.String | lemmaSeparator - Lemma separator character. |
protected static Lemmatizer | lemmatizer - Lemmatizer. |
protected static PartOfSpeechTags | partOfSpeechTags - Part of speech tags. |
protected static WordTokenizer | spellingTokenizer - Spelling tokenizer. |
Modifier | Constructor and Description |
---|---|
protected | MergeBrillLexicon() - Allow overrides but not instantiation. |
Modifier and Type | Method and Description |
---|---|
static java.lang.String | getLemma(java.lang.String spelling, java.lang.String partOfSpeech) - Get lemma for a word. |
static void | main(java.lang.String[] args) - Main program. |
static void | mergeBrillLexicon(java.lang.String lexiconFileName, java.lang.String brillLexiconFileName, java.lang.String mergedLexiconFileName) - Merge Brill lexicon. |
protected static WordTokenizer spellingTokenizer
protected static Lemmatizer lemmatizer
protected static PartOfSpeechTags partOfSpeechTags
protected static java.lang.String lemmaSeparator
protected MergeBrillLexicon()
public static void mergeBrillLexicon(java.lang.String lexiconFileName, java.lang.String brillLexiconFileName, java.lang.String mergedLexiconFileName) throws java.io.IOException
Parameters:
lexiconFileName - MorphAdorner lexicon file name.
brillLexiconFileName - Brill format lexicon file name.
mergedLexiconFileName - Merged lexicon file name.
Throws:
java.io.IOException
public static java.lang.String getLemma(java.lang.String spelling, java.lang.String partOfSpeech)
Parameters:
spelling - The word spelling.
partOfSpeech - The part of speech tag.
public static void main(java.lang.String[] args)