Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | N_GRAM | 3 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | STR_ADORN_EXISTING_XML_FILES | "xml.adorn_existing_xml_files" |
protected static final java.lang.String | STR_CLOSE_SENTENCE_AT_END_OF_HARD_TAG | "xml.close_sentence_at_end_of_hard_tag" |
protected static final java.lang.String | STR_CLOSE_SENTENCE_AT_END_OF_JUMP_TAG | "xml.close_sentence_at_end_of_jump_tag" |
protected static final java.lang.String | STR_CONTEXT_RULES | "partofspeechtagger.context_rules" |
protected static final java.lang.String | STR_DISALLOW_WORD_ELEMENTS_IN | "xml.disallow_word_elements_in" |
protected static final java.lang.String | STR_DOCTYPE_NAME | "xml.doctype.name" |
protected static final java.lang.String | STR_DOCTYPE_SYSTEM | "xml.doctype.system" |
protected static final java.lang.String | STR_ENTITIES_MERGE | "xml.entities_merge" |
protected static final java.lang.String | STR_ENTITIES_NOT_FILES | "xml.entities_not_files" |
protected static final java.lang.String | STR_ENTITIES_TREAT_ALL | "xml.entities_treat_all" |
protected static final java.lang.String | STR_FIELD_DELIMITERS | "xml.field_delimiters" |
protected static final java.lang.String | STR_FIX_GAP_TAGS | "xml.fix_gap_tags" |
protected static final java.lang.String | STR_FIX_ORIG_TAGS | "xml.fix_orig_tags" |
protected static final java.lang.String | STR_FIX_SPLIT_WORDS | "xml.fix_split_words" |
protected static final java.lang.String | STR_ID | "xml.id.attribute" |
protected static final java.lang.String | STR_ID_SPACING | "xml.id.spacing" |
protected static final java.lang.String | STR_ID_TYPE | "xml.id.type" |
protected static final java.lang.String | STR_IGNORE_TAG_CASE | "xml.ignore_tag_case" |
protected static final java.lang.String | STR_JUMP_TAGS | "xml.jump_tags" |
protected static final java.lang.String | STR_LEXICAL_RULES | "partofspeechtagger.lexical_rules" |
protected static final java.lang.String | STR_LOG | "xml.log" |
protected static final java.lang.String | STR_OUTPUT_FILE | "xml.output_file" |
protected static final java.lang.String | STR_OUTPUT_NONREDUNDANT_ATTRIBUTES_ONLY | "xml.output_nonredundant_attributes_only" |
protected static final java.lang.String | STR_OUTPUT_NONREDUNDANT_EOS_ATTRIBUTE | "xml.output_nonredundant_eos_attribute" |
protected static final java.lang.String | STR_OUTPUT_NONREDUNDANT_PART_ATTRIBUTE | "xml.output_nonredundant_part_attribute" |
protected static final java.lang.String | STR_OUTPUT_NONREDUNDANT_TOKEN_ATTRIBUTE | "xml.output_nonredundant_token_attribute" |
protected static final java.lang.String | STR_OUTPUT_PSEUDO_PAGE_BOUNDARY_MILESTONES | "xml.output_pseudo_page_boundary_milestones" |
protected static final java.lang.String | STR_OUTPUT_SENTENCE_BOUNDARY_MILESTONES | "xml.output_sentence_boundary_milestones" |
protected static final java.lang.String | STR_OUTPUT_WHITESPACE_ELEMENTS | "xml.output_whitespace_elements" |
protected static final java.lang.String | STR_PSEUDO_PAGE_CONTAINER_DIV_TYPES | "xml.pseudo_page_container_div_types" |
protected static final java.lang.String | STR_PSEUDO_PAGE_SIZE | "xml.pseudo_page_size" |
protected static final java.lang.String | STR_PUNC_TAG_NAME | "xml.punc_tag_name" |
protected static final java.lang.String | STR_RELATIVE_URI_BASE | "xml.relative_uri_base" |
protected static final java.lang.String | STR_REPEAT_ATTRIBUTES | "xml.repeat_attributes" |
protected static final java.lang.String | STR_SOFT_TAGS | "xml.soft_tags" |
protected static final java.lang.String | STR_SPECIAL_SEPARATOR | "xml.special_separator" |
protected static final java.lang.String | STR_SPELLING_PAIRS | "spelling.spelling_pairs" |
protected static final java.lang.String | STR_SPELLING_PAIRS_BY_WORD_CLASS | "spelling.spelling_pairs_by_word_class" |
protected static final java.lang.String | STR_STANDARD_SPELLINGS | "spelling.standard_spellings" |
protected static final java.lang.String | STR_SUFFIX_LEXICON | "lexicon.suffix_lexicon" |
protected static final java.lang.String | STR_SURROUND_MARKER | "xml.surround_marker" |
protected static final java.lang.String | STR_TAGS_PATH | "xml.tags_path" |
protected static final java.lang.String | STR_TOKENLABEL_ATTRIBUTE | "xml.tokenlabel.attribute" |
protected static final java.lang.String | STR_TOKENLABEL_EMIT | "xml.tokenlabel.emit" |
protected static final java.lang.String | STR_TOKENLABEL_PREPENDWORKNAME | "xml.tokenlabel.prependworkname" |
protected static final java.lang.String | STR_TOKENLABEL_SPACING | "xml.tokenlabel.spacing" |
protected static final java.lang.String | STR_TRANSITION_MATRIX | "partofspeechtagger.transition_matrix" |
protected static final java.lang.String | STR_USE_PC_TO_MARK_END_OF_SENTENCE | "xml.use_pc_to_mark_end_of_sentence" |
protected static final java.lang.String | STR_WORD_DELIMITERS | "xml.word_delimiters" |
protected static final java.lang.String | STR_WORD_FIELD | "xml.word_field" |
protected static final java.lang.String | STR_WORD_LEXICON | "lexicon.word_lexicon" |
protected static final java.lang.String | STR_WORD_PATH | "xml.word_path" |
protected static final java.lang.String | STR_WORD_TAG_NAME | "xml.word_tag_name" |
protected static final java.lang.String | STR_XMLSCHEMA | "xml.xml_schema" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | ATTRS | 2 |
public static final int | IDLEFT | 1 |
public static final int | IDRIGHT | 3 |
public static final int | IDVALUE | 2 |
public static final int | LEFT | 1 |
public static final int | PATHLEFT | 1 |
public static final int | PATHRIGHT | 3 |
public static final int | PATHVALUE | 2 |
public static final int | RIGHT | 4 |
public static final int | WORD | 3 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | defaultAbbreviationsFileName | "resources/en-abbrevs.properties" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | defaultAposTokensFileName | "resources/en-apostokens.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | doublingVerbsPath | "resources/doublingverbs.txt" |
protected static final java.lang.String | irregularVerbsPath | "resources/irregularverbs.txt" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String |
POSTFIX_ADJECTIVE_REGEX |
"((?!major|lieutenant|brigadier|adjutant)\\S+(?=(?:-|\\s+)general)|court(?=(?:-|\\s+)martial))(.*)" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final char | letterGapChar | 9679 |
protected static final java.lang.String | letterGapString | "\u25cf" |
protected static final char | spanGapChar | 8230 |
protected static final java.lang.String | spanGapString | "\u2026" |
protected static final char | wordGapChar | 9674 |
protected static final java.lang.String | wordGapString | "\u25ca" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected final java.lang.String |
teiHeaderPattern |
"tei|tei\\.2|TEI|TEI\\.2" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | LEFT | 0 |
public static final int | RIGHT | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | defaultSuffixLexiconPath | "resources/nupossuffix.lex" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | defaultLexiconPath | "resources/nupos.lex" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | pennTreebankSuffixLexiconPath | "resources/pennsuffix.lex" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | pennTreebankLexiconPath | "resources/penn.lex" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | nuposResourcePath | "resources/nupostags.properties" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | ADJECTIVE | "adjective" |
public static final java.lang.String | ADVERB | "adverb" |
public static final java.lang.String | CARDINAL_NUMERAL | "numeral-cardinal" |
public static final int | DESCRIPTION_INDEX | 4 |
public static final java.lang.String | ENGLISH_WORD | "foreign-english" |
public static final java.lang.String | FOREIGN_WORD | "foreign-word" |
public static final java.lang.String | FRENCH_WORD | "foreign-french" |
public static final int | GENERAL_TAG_NAME_INDEX | 3 |
public static final java.lang.String | GERMAN_WORD | "foreign-german" |
public static final java.lang.String | GREEK_WORD | "foreign-greek" |
public static final java.lang.String | HEBREW_WORD | "foreign-hebrew" |
public static final java.lang.String | INTERJECTION | "interjection" |
public static final java.lang.String | ITALIAN_WORD | "foreign-italian" |
public static final java.lang.String | LATIN_WORD | "foreign-latin" |
public static final int | MAJOR_WORDCLASS_INDEX | 2 |
public static final java.lang.String | NONE | "none" |
public static final java.lang.String | ORDINAL_NUMERAL | "numeral-ordinal" |
public static final java.lang.String | PLURAL_NOUN | "noun-plural" |
public static final java.lang.String | PLURAL_PROPER_NOUN | "noun-proper-plural" |
public static final java.lang.String | POSSESSIVE_NOUN | "noun-possessive" |
public static final java.lang.String | POSSESSIVE_PLURAL_NOUN | "noun-plural-possessive" |
public static final java.lang.String | POSSESSIVE_PLURAL_PROPER_NOUN | "noun-proper-plural-possessive" |
public static final java.lang.String | POSSESSIVE_SINGULAR_NOUN | "noun-singular-possessive" |
public static final java.lang.String | POSSESSIVE_SINGULAR_PROPER_NOUN | "noun-proper-singular-possessive" |
public static final java.lang.String | PROPER_NOUN | "noun-proper" |
public static final java.lang.String | PUNCTUATION | "punctuation" |
public static final java.lang.String | SINGULAR_NOUN | "noun-singular" |
public static final java.lang.String | SINGULAR_PROPER_NOUN | "noun-proper-singular" |
public static final java.lang.String | SPANISH_WORD | "foreign-spanish" |
public static final java.lang.String | SYMBOL | "symbol" |
public static final int | TAG_INDEX | 0 |
public static final java.lang.String | UNDETERMINED | "undetermined" |
public static final java.lang.String | VERB | "verb" |
public static final java.lang.String | VERB_PAST | "verb-past" |
public static final java.lang.String | VERB_PAST_PARTICIPLE | "verb-past-participle" |
public static final java.lang.String | VERB_PRESENT_PARTICIPLE | "verb-present-participle" |
public static final int | WORDCLASS_INDEX | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | pennTreebankResourcePath | "resources/penntreebanktags.properties" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | MAXSOUNDEXLENGTH | 4 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | staart | "STAART" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | transitionMatrixPath | "resources/nupostransitionmatrix.mat" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | transitionMatrixPath | "resources/penntreebanktransitionmatrix.mat" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | BIGRAM | 1 |
protected static final int | TRIGRAM | 2 |
protected static final int | UNIGRAM | 0 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | LDQUOTESTR | "\u201c" |
protected static final java.lang.String | LSQUOTESTR | "\u2018" |
protected static final java.lang.String | RDQUOTESTR | "\u201d" |
protected static final java.lang.String | RSQUOTESTR | "\u2019" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | disallowedSentenceStarters | ",%." |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | wordMapPath | "resources/abbc.tab" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | wordMapPath | "resources/abbc.tab" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | macronMapResourceName | "resources/macronmap.tab" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | DICE | 0 |
public static final int | LOGLIKE | 1 |
public static final int | PHISQUARED | 2 |
public static final int | SCP | 4 |
public static final int | SMI | 3 |
public static final int | T | 5 |
public static final int | Z | 6 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final char | zeroDigit | 48 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INC | 50 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | DATABASE_DIRECTORY | "wordnet.database.dir" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String |
alwaysSeparators |
"((-{2,})|(\\.{3,})|[\\(\\)\\[\\]\\{\\}\";:/=`\u00b6<>\u00a1\u00bf\u00ab\u00bb_\u201c\u201d\u2014\\|\u00a6\u2758[\\p{InGeneralPunctuation}&&[^\u2022\u2032\u2033\u2034\u2018\u2019\u2010\u2011]]\\p{InLetterlikeSymbols}\\p{InMathematicalOperators}\\p{InMiscellaneousTechnical}[\\p{InGeometricShapes}&&[^\u25cf]]\\p{InMiscellaneousSymbols}\\p{InDingbats}\\p{InAlphabeticPresentationForms}])" |
protected static final java.lang.String | asterisks | "([\\*]+)" |
protected static final java.lang.String | commaSeparator | "(,)([^0-9])" |
protected static final java.lang.String | hyphens | "(-{2,})" |
protected static final java.lang.String | periods | "(\\.{3,})" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String |
EccoAlwaysSeparators |
"((-{2,})|(\\.{3,})|[\\(\\)\\[\\]\";:/=`\u00b6<>\u00a1\u00bf\u00ab\u00bb\u201c\u201d\u00a6\u2758[\\p{InGeneralPunctuation}&&[^\\{\\}\\|\u2022\u2032\u2033\u2034\u2018\u2019\u2010\u2011\u2026\u2042\u2020\u2021\u00a7]]\\p{InLetterlikeSymbols}\\p{InMathematicalOperators}\\p{InMiscellaneousTechnical}[\\p{InGeometricShapes}&&[^\u25cf\u25ca]]\\p{InMiscellaneousSymbols}\\p{InDingbats}\\p{InAlphabeticPresentationForms}])" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String |
EEBOAlwaysSeparators |
"((-{2,})|(\\.{3,})|[\\(\\)\\[\\]\";:/=\u00b6<>\u201c\u201d\u2014\u00a6\u2758[\\p{InGeneralPunctuation}&&[^\\{\\}\\|\u2022\u2032\u2033\u2034\u2018\u2019\u2010\u2011\u2026]]\\p{InLetterlikeSymbols}\\p{InMathematicalOperators}\\p{InMiscellaneousTechnical}[\\p{InGeometricShapes}&&[^\u25cf\u25ca]]\\p{InMiscellaneousSymbols}\\p{InDingbats}\\p{InAlphabeticPresentationForms}])" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | BASE_SENTENCE_ANNOTATION_TYPE_PARAMETER_NAME | "baseSentenceAnnotationType" |
public static final java.lang.String | BASE_TOKEN_ANNOTATION_TYPE_PARAMETER_NAME | "baseTokenAnnotationType" |
public static final java.lang.String | TAG_DOCUMENT_PARAMETER_NAME | "document" |
public static final java.lang.String | TAG_INPUT_AS_PARAMETER_NAME | "inputASName" |
public static final java.lang.String | TAG_OUTPUT_AS_PARAMETER_NAME | "outputASName" |
public static final java.lang.String | TOKEN_LEMMA_FEATURE_NAME | "lemma" |
public static final java.lang.String | TOKEN_SPELLING_FEATURE_NAME | "spelling" |
public static final java.lang.String | TOKEN_STANDARD_SPELLING_FEATURE_NAME | "standard" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final long | serialVersionUID | -1L |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | ATTRS | 2 |
protected static final int | CDATA | 2 |
protected static final int | CLEFT | 1 |
protected static final int | CRIGHT | 3 |
protected static final int | LEFT | 1 |
protected static final int | MAXLINEWIDTH | 80 |
protected static final int | RIGHT | 4 |
protected static final int | WORD | 3 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 5 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | CHECKBOX | 7 |
protected static final int | CORLEM | 5 |
protected static final int | CORPOS | 6 |
protected static final int | CORSPELL | 3 |
protected static final int | SPELL | 2 |
protected static final int | STANSPELL | 4 |
public static final int | TABFIELDSCOUNT | 9 |
protected static final int | UPDATEDID | 8 |
protected static final int | WORDID | 1 |
protected static final int | WORKID | 0 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | DIVTYPE | 16 |
protected static final int | INITPARAMS | 1 |
protected static final int | LEMMA | 5 |
protected static final int | PATH | 7 |
protected static final int | POS | 6 |
protected static final int | SPELLING | 2 |
protected static final int | STANDARD | 4 |
protected static final int | WORKID | 0 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | apos | "'" |
protected static final java.lang.String | dq | "\ue061" |
protected static final java.lang.String | ldquo | "“" |
protected static final java.lang.String | lsquo | "‘" |
protected static final java.lang.String | rdquo | "”" |
protected static final java.lang.String | rsquo | "’" |
protected static final java.lang.String | sq | "\ue060" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | ap | "\ue062" |
protected static final java.lang.String | apos | "'" |
protected static final java.lang.String | dq | "\ue061" |
protected static final int | INITPARAMS | 3 |
protected static final java.lang.String | ldquo | "“" |
protected static final java.lang.String | lsquo | "‘" |
protected static final java.lang.String | rdquo | "”" |
protected static final java.lang.String | rsquo | "’" |
protected static final java.lang.String | sq | "\ue060" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 1 |
protected static final java.lang.String |
teiHeaderPattern |
"tei|tei\\.2|TEI|TEI\\.2" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | CANDIDATE_1 | 1 |
protected static final int | CANDIDATE_2 | 2 |
protected static final int | START | 0 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 5 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | INITPARAMS | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final char | ASTERISM | 8258 |
public static final java.lang.String | ASTERISM_STRING | "\u2042" |
public static final char | BLACKCIRCLE | 9679 |
public static final java.lang.String | BLACKCIRCLE_STRING | "\u25cf" |
public static final char | BROKEN_VERTICAL_BAR | 166 |
public static final java.lang.String | BROKEN_VERTICAL_BAR_STRING | "\u00a6" |
public static final char | CHAR_END_OF_TEXT_SECTION | 58624 |
public static final java.lang.String | CHAR_END_OF_TEXT_SECTION_STRING | "\ue500" |
public static final char | CHAR_FAKE_SOFT_HYPHEN | 58625 |
public static final java.lang.String | CHAR_FAKE_SOFT_HYPHEN_STRING | "\ue501" |
public static final char | CHAR_GAP_MARKER | 9679 |
public static final java.lang.String | CHAR_GAP_MARKER_STRING | "\u25cf" |
public static final char | CHAR_SUBSTITUTE_SINGLE_QUOTE | 58626 |
public static final java.lang.String | CHAR_SUBSTITUTE_SINGLE_QUOTE_STRING | "\ue502" |
public static final char | CHAR_SUP_TEXT_MARKER | 58627 |
public static final java.lang.String | CHAR_SUP_TEXT_MARKER_STRING | "\ue503" |
public static final char | COMBINING_MACRON | 772 |
public static final java.lang.String | COMBINING_MACRON_STRING | "\u0304" |
public static final char | DAGGER | 8224 |
public static final java.lang.String | DAGGER_STRING | "\u2020" |
public static final char | DEGREES_MARK | 8242 |
public static final java.lang.String | DEGREES_MARK_STRING | "\u2032" |
public static final char | DIVIDER_VERTICAL_BAR | 8739 |
public static final java.lang.String | DIVIDER_VERTICAL_BAR_STRING | "\u2223" |
public static final char | DOTTEDCIRCLE | 9676 |
public static final java.lang.String | DOTTEDCIRCLE_STRING | "\u25cc" |
public static final char | DOUBLE_DAGGER | 8225 |
public static final java.lang.String | DOUBLE_DAGGER_STRING | "\u2021" |
public static final char | ELLIPSIS | 8230 |
public static final java.lang.String | ELLIPSIS_STRING | "\u2026" |
public static final char | EURO_SIGN | 8364 |
public static final char | INVISIBLE_SEPARATOR | 8291 |
public static final java.lang.String | INVISIBLE_SEPARATOR_STRING | "\u2063" |
public static final char | LDQUOTE | 8220 |
public static final java.lang.String | LDQUOTE_STRING | "\u201c" |
public static final char | LEFT_ANGLE_BRACKET | 12296 |
public static final java.lang.String | LEFT_ANGLE_BRACKET_STRING | "\u3008" |
public static final char | LIGHT_VERTICAL_BAR | 10072 |
public static final java.lang.String | LIGHT_VERTICAL_BAR_STRING | "\u2758" |
public static final char | LONG_DASH | 8212 |
public static final java.lang.String | LONG_DASH_STRING | "\u2014" |
public static final char | LONG_S | 383 |
public static final java.lang.String | LONG_S_STRING | "\u017f" |
public static final char | LOZENGE | 9674 |
public static final java.lang.String | LOZENGE_STRING | "\u25ca" |
public static final char | LSQUOTE | 8216 |
public static final java.lang.String | LSQUOTE_STRING | "\u2018" |
public static final char | MINUTES_MARK | 8243 |
public static final char | NONBREAKING_BLANK | 160 |
public static final java.lang.String | NONBREAKING_BLANK_STRING | "\u00a0" |
public static final char | NONBREAKING_HYPHEN | 8209 |
public static final java.lang.String | NONBREAKING_HYPHEN_STRING | "\u2011" |
public static final char | OLD_EURO_SIGN | 8352 |
public static final char | PARAGRAPH | 182 |
public static final java.lang.String | PARAGRAPH_STRING | "\u00b6" |
public static final char | RDQUOTE | 8221 |
public static final java.lang.String | RDQUOTE_STRING | "\u201d" |
public static final char | RIGHT_ANGLE_BRACKET | 12297 |
public static final java.lang.String | RIGHT_ANGLE_BRACKET_STRING | "\u3009" |
public static final char | RLSQUOTE | 8218 |
public static final java.lang.String | RLSQUOTE_STRING | "\u201a" |
public static final char | RSQUOTE | 8217 |
public static final java.lang.String | RSQUOTE_STRING | "\u2019" |
public static final char | SECONDS_MARK | 8244 |
public static final char | SECTION_SIGN | 167 |
public static final java.lang.String | SECTION_SIGN_STRING | "\u00a7" |
public static final char | SHORT_DASH | 8208 |
public static final java.lang.String | SHORT_DASH_STRING | "\u2010" |
public static final char | SOLAR_CIRCLE | 8857 |
public static final java.lang.String | SOLAR_CIRCLE_STRING | "\u2299" |
public static final char | SOLIDCIRCLE | 8226 |
public static final java.lang.String | SOLIDCIRCLE_STRING | "\u2022" |
public static final java.lang.String | SPAN_GAP_MARKER | "\u3008\u2026\u3009" |
public static final char | UNKNOWN_PUNC | 9642 |
public static final char | VERTICAL_BAR | 124 |
public static final java.lang.String |
VERTICAL_BAR_STRING |
"|" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | MAX_ROMAN_NUMERAL | 5000 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | BITS | 64 |
protected static final int | BITS_M1 | 63 |
protected static final int | LG_BITS | 6 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final java.lang.String | keyValueSeparators | "=: \t\r\n\f" |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final char | DEFAULT_QUALIFIER | 34 |
protected static final char | DEFAULT_SEPARATOR | 44 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | DEBUG | 4 |
public static final int | ERROR | 1 |
public static final int | FATAL | 0 |
public static final int | INFO | 3 |
public static final int | WARN | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final java.lang.String | DATE_TIME_FORMAT | "yyyy-MM-dd hh:mm:ss,SSS" |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final double | LN10INV | 0.4342944819032518 |
public static final double | MAXLOG | 709.782712893384 |
public static final double | MINLOG | -745.1332191019412 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final double | MAXGAM | 171.6243769563027 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | FALSEPOSITION | 1 |
public static final int | ILLINOIS | 2 |
public static final int | PLAIN | 0 |
Modifier and Type | Constant Field | Value |
---|---|---|
protected static final int | MAXDIFFS | 2 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | AND_type | 1 |
public static final java.lang.String | ANDABLE_CONNECTORS_WORD | "ANDABLE-CONNECTORS" |
public static final int | BAD_WORD | 251 |
public static final int | BOTH_LABEL | -7 |
public static final int | BUILDEXPR | 6 |
public static final char | CLOSE_BRACKET | 93 |
public static final int | COMMA_LABEL | -2 |
public static final char | COMMENT_CHAR | 37 |
public static final int | CONNECTOR_type | 2 |
public static final int | CType_CLOSE | 1 |
public static final int | CType_OPEN | 0 |
public static final int | CType_WORD | 2 |
public static final java.lang.String | DEFAULTPATH | ".:./data:./data/link:/home/liferay/linkgrammar:/home/liferay/linkgrammar/data:/home/liferay/linkgrammar/data/link" |
public static final int | DICTPARSE | 2 |
public static final int | DISPLAY_MAX | 1024 |
public static final int | DOWN_priority | 2 |
public static final java.lang.String | ED_WORD | "ED-WORDS" |
public static final int | EITHER_LABEL | -3 |
public static final int | GENTLE | 1 |
public static final int | HT_SIZE | 1024 |
public static final java.lang.String | HYPHENATED_WORD | "HYPHENATED-WORDS" |
public static final java.lang.String | ING_WORD | "ING-WORDS" |
public static final int | INTERNALERROR | 7 |
public static final java.lang.String | LEFT_WALL_DISPLAY | "LEFT-WALL" |
public static final java.lang.String | LEFT_WALL_SUPPRESS | "Wd" |
public static final java.lang.String | LEFT_WALL_WORD | "LEFT-WALL" |
public static final int | LINE_LIMIT | 70 |
public static final int | LINKSET_DEFAULT_SEED | 37 |
public static final int | LINKSET_MAX_SETS | 512 |
public static final int | LINKSET_SEED_VALUE | 37 |
public static final int | LINKSET_SPARSENESS | 2 |
public static final java.lang.String | LY_WORD | "LY-WORDS" |
public static final int | MAX_DISJUNCT_COST | 10000 |
public static final int | MAX_HEIGHT | 30 |
public static final int | MAX_LINE | 1500 |
public static final int | MAX_LINKS | 497 |
public static final int | MAX_PATH_NAME | 400 |
public static final int | MAX_SENTENCE | 250 |
public static final int | MAX_STRIP | 10 |
public static final int | MAX_TOKEN_LENGTH | 50 |
public static final int | MAX_WORD | 60 |
public static final int | MAXCONSTITUENTS | 1024 |
public static final int | MAXINPUT | 1024 |
public static final int | MAXSUBL | 16 |
public static final int | NEGATIVECOST | -1000000 |
public static final int | NEITHER_LABEL | -4 |
public static final char | NO_LABEL | 32 |
public static final int | NO_WORD | 255 |
public static final int | NOCUTOFF | 1000 |
public static final int | NODICT | 1 |
public static final int | NORMAL_LABEL | -1 |
public static final int | NOT_LABEL | -5 |
public static final int | NOTINDICT | 5 |
public static final int | NOTONLY_LABEL | -6 |
public static final java.lang.String | NUMBER_WORD | "NUMBERS" |
public static final char | OPEN_BRACKET | 91 |
public static final int | OR_type | 0 |
public static final char | PARSE_WITH_DISJUNCT_COST_GT_0 | 58 |
public static final java.lang.String | PL_PROPER_WORD | "PL-CAPITALIZED-WORDS" |
public static final java.lang.String | POSTPROCESS_WORD | "POSTPROCESS" |
public static final int | PP_FIRST_PASS | 1 |
public static final int | PP_LEXER_MAX_LABELS | 512 |
public static final int | PP_MAX_DOMAINS | 128 |
public static final int | PP_MAX_UNIQUE_LINK_NAMES | 1024 |
public static final int | PP_SECOND_PASS | 2 |
public static final java.lang.String | PROPER_WORD | "CAPITALIZED-WORDS" |
public static final java.lang.String | RIGHT_WALL_DISPLAY | "RIGHT-WALL" |
static final java.lang.String | RIGHT_WALL_SUPPRESS | "RW" |
public static final java.lang.String | RIGHT_WALL_WORD | "RIGHT-WALL" |
public static final int | RTSIZE | 256 |
public static final int | RUTHLESS | 0 |
public static final java.lang.String | S_WORD | "S-WORDS" |
public static final int | SEPARATE | 4 |
public static final int | SHORT_LEN | 6 |
public static final int | THIN_priority | 0 |
public static final char | UNGRAMMATICAL | 42 |
public static final java.lang.String | UNKNOWN_WORD | "UNKNOWN-WORD" |
public static final java.lang.String | UNLIMITED_CONNECTORS_WORD | "UNLIMITED-CONNECTORS" |
public static final int | UNLIMITED_LEN | 255 |
public static final int | UP_priority | 1 |
public static final int | VDAL | 1 |
public static final int | WORDFILE | 3 |
public static final int | WType_NONE | 0 |
public static final int | WType_PTYPE | 2 |
public static final int | WType_QDTYPE | 4 |
public static final int | WType_QTYPE | 3 |
public static final int | WType_STYPE | 1 |
Modifier and Type | Constant Field | Value |
---|---|---|
public static final int | CMS_SIZE | 2048 |