/**
 * Exercises extraction of the sample Word document in two ways.
 *
 * <p>First, the string content obtained from the call that omits the MIME
 * type must equal the content obtained when {@code "application/msword"}
 * is passed explicitly. Second, parsing the file with the parser registered
 * for that MIME type must populate the title metadata with the expected
 * value.
 *
 * @throws Exception if the resource cannot be located, read, or parsed
 */
public void testWORDxtraction() throws Exception {
    final String wordMimeType = "application/msword";
    File wordFile = getResourceAsFile("/test-documents/testWORD.doc");

    // Both content-extraction entry points must agree on the text.
    String contentWithoutType = ParseUtils.getStringContent(wordFile, tc);
    String contentWithType = ParseUtils.getStringContent(wordFile, tc, wordMimeType);
    assertEquals(contentWithoutType, contentWithType);

    // Parse again through the parser looked up by MIME type, this time
    // discarding content events and keeping only the collected metadata.
    Parser wordParser = tc.getParser(wordMimeType);
    Metadata collected = new Metadata();
    InputStream input = new FileInputStream(wordFile);
    try {
        wordParser.parse(input, new DefaultHandler(), collected);
    } finally {
        // Always release the file handle, even when parsing fails.
        input.close();
    }

    String title = collected.get(Metadata.TITLE);
    assertEquals("Sample Word Document", title);
}