public class NGram
extends java.lang.Object
| Modifier and Type | Field and Description |
|---|---|
| `(package private) static java.lang.String[]` | `CJK_CLASS` — CJK Kanji Normalization Mapping |
| `static java.util.HashMap<java.lang.Character,java.lang.Character>` | `cjk_map` |
| `static int` | `N_GRAM` |
| Constructor and Description |
|---|
| `NGram()` — Constructor. |
| Modifier and Type | Method and Description |
|---|---|
| `void` | `addChar(char ch)` — Append a character to the n-gram buffer. |
| `java.lang.String` | `get(int n)` — Get n-Gram |
| `static java.lang.String` | `normalize_vi(java.lang.String text)` — Normalizer for Vietnamese. |
| `static char` | `normalize(char ch)` — Character Normalization |
public static final int N_GRAM
public static java.util.HashMap<java.lang.Character,java.lang.Character> cjk_map
static final java.lang.String[] CJK_CLASS
public void addChar(char ch)
ch - the character to append to the n-gram buffer
public java.lang.String get(int n)
n - length of n-gram
public static char normalize(char ch)
ch - the character to normalize
public static java.lang.String normalize_vi(java.lang.String text)
text - the text to normalize for Vietnamese