**/
public class HtmlSimhash {
/** Shared static logger for this class, obtained via {@code Logger.getLogger(HtmlSimhash.class)}. */
private static final Logger LOG = Logger.getLogger( HtmlSimhash.class );
public static void main( String[] args ) {
Tap inputTap = new Hfs( new TextDelimited(
new Fields("docid", "body"), " " ),
args[0] );
Tap outputTap = new StdoutTap();
// create the flow