|
||||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||||
java.lang.Object
de.folt.models.documentmodel.xliff.XliffTokenizer
public class XliffTokenizer
This class tokenizes XLIFF source, seg-source, or target elements into a word list. In fact, it can tokenize any Element. The tokenizer works independently of the language.
| Constructor Summary | |
|---|---|
XliffTokenizer()
|
|
XliffTokenizer(XliffDocument xliffDocument)
|
|
XliffTokenizer(XliffDocument xliffDocument,
java.lang.String language)
|
|
XliffTokenizer(XliffDocument xliffDocument,
java.lang.String language,
WordHandling wordHandling)
|
|
XliffTokenizer(XliffDocument xliffDocument,
WordHandling wordHandling)
|
|
| Method Summary | |
|---|---|
java.lang.String |
getLanguage()
|
WordHandling |
getWordHandling()
|
XliffDocument |
getXliffDocument()
|
static void |
main(java.lang.String[] args)
|
java.lang.String |
markUpTokens(java.util.Vector<java.lang.String> tokens)
Constructs a string from the tokens and marks them up |
java.util.Vector<java.lang.String> |
removeElement(java.util.Vector<java.lang.String> tokens,
java.lang.String element)
|
java.util.Vector<java.lang.String> |
removeInString(java.util.Vector<java.lang.String> tokens,
java.lang.String string)
|
java.util.Vector<java.lang.String> |
removeMrkTokens(java.util.Vector<java.lang.String> tokens)
Removes mrk word/stop tokens from the vector |
java.util.Vector<java.lang.String> |
removeString(java.util.Vector<java.lang.String> tokens,
java.lang.String string)
|
void |
setLanguage(java.lang.String language)
|
void |
setWordHandling(WordHandling wordHandling)
|
void |
setXliffDocument(XliffDocument xliffDocument)
|
static void |
test(java.lang.String[] args)
Simple test method for generating DataModelInstances |
org.jdom.Element |
tokenize(org.jdom.Element element)
Tokenize an xliff Element |
java.util.Vector<java.lang.String> |
tokenize(java.lang.String string)
|
java.util.Vector<java.lang.String> |
tokenize(java.lang.String string,
java.lang.String language)
Tokenize a string |
java.util.Vector<java.lang.String> |
tokenizeToVector(org.jdom.Element element)
|
java.util.Vector<java.lang.String> |
tokenizeToVector(org.jdom.Element element,
java.lang.String language)
Tokenize an element to a vector |
java.util.Vector<java.lang.String> |
tokenizeToVector(java.lang.String string)
|
java.util.Vector<java.lang.String> |
tokenizeToVector(java.lang.String string,
java.lang.String language)
|
| Methods inherited from class java.lang.Object |
|---|
equals, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
| Constructor Detail |
|---|
public XliffTokenizer()
public XliffTokenizer(XliffDocument xliffDocument)
xliffDocument -
public XliffTokenizer(XliffDocument xliffDocument,
java.lang.String language)
public XliffTokenizer(XliffDocument xliffDocument,
java.lang.String language,
WordHandling wordHandling)
public XliffTokenizer(XliffDocument xliffDocument,
WordHandling wordHandling)
| Method Detail |
|---|
public static void main(java.lang.String[] args)
args -
public static void test(java.lang.String[] args)
public java.lang.String getLanguage()
public WordHandling getWordHandling()
public XliffDocument getXliffDocument()
public java.lang.String markUpTokens(java.util.Vector<java.lang.String> tokens)
tokens - the vector of tokens
public java.util.Vector<java.lang.String> removeElement(java.util.Vector<java.lang.String> tokens,
java.lang.String element)
tokens -
element -
public java.util.Vector<java.lang.String> removeInString(java.util.Vector<java.lang.String> tokens,
java.lang.String string)
tokens -
string -
public java.util.Vector<java.lang.String> removeMrkTokens(java.util.Vector<java.lang.String> tokens)
tokens - the tokens from which to remove word and stop tokens
public java.util.Vector<java.lang.String> removeString(java.util.Vector<java.lang.String> tokens,
java.lang.String string)
tokens -
string -
public void setLanguage(java.lang.String language)
public void setWordHandling(WordHandling wordHandling)
public void setXliffDocument(XliffDocument xliffDocument)
xliffDocument -
public org.jdom.Element tokenize(org.jdom.Element element)
element -
public java.util.Vector<java.lang.String> tokenize(java.lang.String string)
string -
public java.util.Vector<java.lang.String> tokenize(java.lang.String string,
java.lang.String language)
string -
public java.util.Vector<java.lang.String> tokenizeToVector(org.jdom.Element element)
public java.util.Vector<java.lang.String> tokenizeToVector(org.jdom.Element element,
java.lang.String language)
element -
public java.util.Vector<java.lang.String> tokenizeToVector(java.lang.String string)
string -
public java.util.Vector<java.lang.String> tokenizeToVector(java.lang.String string,
java.lang.String language)
string -
language -
|
||||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | |||||||||