"nicht", ",", "also", "muß", "sie", "sie", "sehen", ";", "und", "die", "sehe", "man", "einmal", "in", "einem",
"Paar", "spitzen", "Schultern", ",", "zylindrischen", "Schenkeln", ",", "oder", "leeren", "Ärmeln", ",",
"oder", "lattenförmigen", "Beinen", "."
};
TreebankLanguagePack tlp = new NegraPennLanguagePack();
Tokenizer<? extends HasWord> toke =tlp.getTokenizerFactory().getTokenizer(new StringReader(sample));
List<? extends HasWord> tokens = toke.tokenize();
List<? extends HasWord> goldTokens = Sentence.toWordList(tokenized);
assertEquals("Tokenization length mismatch", goldTokens.size(), tokens.size());
for (int i = 0, sz = goldTokens.size(); i < sz; i++) {
assertEquals("Bad tokenization", goldTokens.get(i).word(), tokens.get(i).word());