public class Document
extends java.lang.Object
implements java.io.Serializable
| Modifier and Type | Field and Description |
|---|---|
| protected Dictionary | dictionary - Internal dictionary that links terms to their numerical representation |
| Constructor and Description |
|---|
| Document(java.lang.String[] text, java.util.Locale language) |
| Document(java.lang.String[] text, java.util.Locale language, boolean includeBow, boolean includeCharNgrams, boolean includeWordNgrams, boolean includePseudoCognates) |
| Document(java.lang.String[] text, java.util.Locale language, boolean includeBow, boolean includeCharNgrams, boolean includeWordNgrams, boolean includePseudoCognates, int nGrams) |
| Document(java.lang.String text, java.util.Locale language) |
| Document(java.lang.String text, java.util.Locale language, boolean includeBow, boolean includeCharNgrams, boolean includeWordNgrams, boolean includePseudoCognates) |
| Document(java.lang.String text, java.util.Locale language, boolean includeBow, boolean includeCharNgrams, boolean includeWordNgrams, boolean includePseudoCognates, int nGrams) |
| Modifier and Type | Method and Description |
|---|---|
| boolean | fragmentExists(int i) |
| java.util.List<java.lang.String> | get(RepresentationType representation) |
| Fragment | getFragment(int i) |
| java.util.Map<java.lang.String,java.lang.Double> | getNormalized(RepresentationType representation) |
| java.lang.String | getText() |
| java.util.Map<java.lang.String,java.lang.Double> | getWeighted(RepresentationType representation) |
| int | length() |
| void | setLanguage(java.util.Locale language) |
| protected java.util.List<java.lang.String> | splitText(java.lang.String text) |
protected final Dictionary dictionary
public Document(java.lang.String text,
java.util.Locale language)
public Document(java.lang.String[] text,
java.util.Locale language)
public Document(java.lang.String text,
java.util.Locale language,
boolean includeBow,
boolean includeCharNgrams,
boolean includeWordNgrams,
boolean includePseudoCognates)
public Document(java.lang.String[] text,
java.util.Locale language,
boolean includeBow,
boolean includeCharNgrams,
boolean includeWordNgrams,
boolean includePseudoCognates)
public Document(java.lang.String text,
java.util.Locale language,
boolean includeBow,
boolean includeCharNgrams,
boolean includeWordNgrams,
boolean includePseudoCognates,
int nGrams)
public Document(java.lang.String[] text,
java.util.Locale language,
boolean includeBow,
boolean includeCharNgrams,
boolean includeWordNgrams,
boolean includePseudoCognates,
int nGrams)
public boolean fragmentExists(int i)
public void setLanguage(java.util.Locale language)
public Fragment getFragment(int i)
i -
public java.util.List<java.lang.String> get(RepresentationType representation)
public java.util.Map<java.lang.String,java.lang.Double> getWeighted(RepresentationType representation)
public java.util.Map<java.lang.String,java.lang.Double> getNormalized(RepresentationType representation)
public java.lang.String getText()
public int length()
protected java.util.List<java.lang.String> splitText(java.lang.String text)
text -