* @throws Exception if the superclass fails to build the base document or the HTML file cannot be parsed
*/
public Document getDocument(File file, File htdocsDumpDir) throws Exception {
    // Start from whatever document the superclass builds for this file.
    final Document doc = super.getDocument(file, htdocsDumpDir);

    // Obtain a parser for the file from the factory and run it before
    // reading any of the parsed values.
    final HTMLParser htmlParser = HTMLParserFactory.newInstance(file);
    htmlParser.parse(file);

    // Add the parser's results one at a time, in a fixed order:
    // title, then keywords, then the content reader.
    final Field titleField = Field.Text("title", htmlParser.getTitle());
    doc.add(titleField);

    final Field keywordsField = Field.Text("keywords", htmlParser.getKeywords());
    doc.add(keywordsField);

    final Field contentsField = Field.Text("contents", htmlParser.getReader());
    doc.add(contentsField);

    return doc;
}