assertEquals(2, content.split("<\\/body>").length);
}
@Test
public void testOutlookHTMLfromRTF() throws Exception {
Parser parser = new AutoDetectParser();
Metadata metadata = new Metadata();
// Check the HTML version
StringWriter sw = new StringWriter();
SAXTransformerFactory factory = (SAXTransformerFactory)
SAXTransformerFactory.newInstance();
TransformerHandler handler = factory.newTransformerHandler();
handler.getTransformer().setOutputProperty(OutputKeys.METHOD, "xml");
handler.getTransformer().setOutputProperty(OutputKeys.INDENT, "yes");
handler.setResult(new StreamResult(sw));
InputStream stream = OutlookParserTest.class.getResourceAsStream(
"/test-documents/test-outlook2003.msg");
try {
parser.parse(stream, handler, metadata, new ParseContext());
} finally {
stream.close();
}
// As the HTML version should have been processed, ensure