TokenStream result = new StandardTokenizer(reader); // splits at ". ", etc.
// result = new SysoFilter(result);
result = new WordSplitTokenizer(result); // non-alphanumerics
result = new DotSplitTokenizer(result); // all.package.names, hyphen-separated-words
result = new CamelCaseTokenizer(result); // CamelCaseIdentifiers
result = new LengthFilter(result, minWordLength, 128);
result = new LowerCaseFilter(result);