public void testIt() throws ProtocolException, ParseException, IOException {
String urlString;
Parse parse;
Configuration conf = NutchConfiguration.create();
MimeUtil mimeutil = new MimeUtil(conf);
urlString = "file:" + sampleDir + fileSeparator + rtfFile;
File file = new File(sampleDir + fileSeparator + rtfFile);
byte[] bytes = new byte[(int) file.length()];
DataInputStream in = new DataInputStream(new FileInputStream(file));
in.readFully(bytes);
in.close();
WebPage page = new WebPage();
page.setBaseUrl(new Utf8(urlString));
page.setContent(ByteBuffer.wrap(bytes));
String mtype = mimeutil.getMimeType(file);
page.setContentType(new Utf8(mtype));
parse = new ParseUtil(conf).parse(urlString, page);
String title = parse.getTitle();