@Test
public void testLuceneStandardTokenizer() throws Exception {
String[] gold = {"I", "can't", "beleive", "that", "the", "Carolina", "Hurricanes", "won", "the", "2005", "2006", "Stanley", "Cup",};
StandardTokenizer tokenizer = new StandardTokenizer(Version.LUCENE_36, new StringReader("I can't beleive that the Carolina Hurricanes won the 2005-2006 Stanley Cup."));
List<String> result = new ArrayList<String>();
while (tokenizer.incrementToken()) {
result.add(((CharTermAttribute) tokenizer.getAttribute(CharTermAttribute.class)).toString());
}
assertTrue("result Size: " + result.size() + " is not: " + gold.length, result.size() == gold.length);
int i = 0;
for (String chunk : result) {