// For example, <xml><book><title>hello</title></book></xml> should not affect the title of the page.
// Create a separate State and register a transition to it on the html state under the name "xml".
// No rules are added to this state in the lines shown here.
// NOTE(review): presumably the transition fires on an <xml> tag so that tags nested inside it
// are not handled by the html rules below — confirm against StateTransitionRule.
State xml = new State();
html.addRule(new StateTransitionRule("xml", xml));
// Useful properties: each rule below is registered on the html state and constructed with `page`.
// NOTE(review): registration order may matter to rule matching — keep as is unless verified.
html.addRule(new HtmlAttributesRule(page)); // attributes in <html> element
html.addRule(new MetaTagRule(page)); // all <meta> tags
html.addRule(new ParameterExtractingRule(page)); // <parameter> blocks
html.addRule(new ContentBlockExtractingRule(page)); // <content> blocks
// Capture properties written to documents by MS Office (author, version, company, etc).