*
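* @param html the HTML fragment to sanitize; it is parsed as a body fragment
* @return the inner HTML of the cleaned document's body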
*/
public static String removeUnSafeTag(String html) {
SishuokWhitelist whitelist = new SishuokWhitelist();
whitelist.addTags("embed", "object", "param", "span", "div", "img", "font", "del");
whitelist.addTags("a", "b", "blockquote", "br", "caption", "cite", "code", "col", "colgroup");
whitelist.addTags("dd", "dl", "dt", "em", "hr", "h1", "h2", "h3", "h4", "h5", "h6", "i", "img");
whitelist.addTags("li", "ol", "p", "pre", "q", "small", "strike", "strong", "sub", "sup", "table");
whitelist.addTags("tbody", "td", "tfoot", "th", "thead", "tr", "u", "ul");
// Intent: strip attributes whose names start with "on" (event handlers).
whitelist.addAttributes(":all", "on");
Document dirty = Jsoup.parseBodyFragment(html, "");
SishuokCleaner cleaner = new SishuokCleaner(whitelist);
Document clean = cleaner.clean(dirty);
return clean.body().html();