Package org.htmlcleaner

Examples of org.htmlcleaner.CleanerProperties


        xml = CommonUtil.toXml((Node)node, keepHeader);
        return CommonUtil.toHTML(xml);
      }else if (node instanceof TagNode){
        StringWriter sw = new StringWriter();
        //TODO load this CleanerProperties from a configuration file
        CleanerProperties prop = new HtmlCleaner().getProperties();
        SimpleXmlSerializer ser = new SimpleXmlSerializer(prop);
        ser.write((TagNode)node, sw, "UTF-8");
          String html = sw.getBuffer().toString();
          if (keepHeader)
            xml = html;
View Full Code Here


    StringBuffer sbResult = new StringBuffer();
    try
    {
      HtmlCleaner cleaner = new HtmlCleaner();
     
      CleanerProperties props = cleaner.getProperties();
      props.setUseEmptyElementTags(false);
     
      TagNode node = cleaner.clean(sb.toString());
      Document myJDom = new JDomSerializer(props, true).createJDom(node);
      XMLOutputter outputter = new XMLOutputter(Format.getPrettyFormat());
      sbResult.append(outputter.outputString(myJDom));
View Full Code Here

    this.html = html;

    // create an instance of HtmlCleaner
    cleaner = new HtmlCleaner();
    // take default cleaner properties
    CleanerProperties props = cleaner.getProperties();

    // customize cleaner's behaviour with property setters
    // props.setXXX(...);
    props.setOmitXmlDeclaration(true);
    props.setOmitHtmlEnvelope(true);

    // Clean HTML taken from simple string, file, URL, input stream,
    // input source or reader. Result is root node of created
    // tree-like structure. Single cleaner instance may be safely used
    // multiple times.
View Full Code Here

    this.url = url;

    // create an instance of HtmlCleaner
    cleaner = new HtmlCleaner();
    // take default cleaner properties
    CleanerProperties props = cleaner.getProperties();

    // customize cleaner's behaviour with property setters
    // props.setXXX(...);
    props.setOmitXmlDeclaration(true);
    props.setOmitHtmlEnvelope(true);

    // Clean HTML taken from simple string, file, URL, input stream,
    // input source or reader. Result is root node of created
    // tree-like structure. Single cleaner instance may be safely used
    // multiple times.
View Full Code Here

  {
    // serialize a node to a file, output stream, DOM, JDom...
    System.out.println( "\n\n\nINICIO");

    HtmlCleaner cleaner = new HtmlCleaner();
    CleanerProperties props = cleaner.getProperties();
    PrettyXmlSerializer serializer = new PrettyXmlSerializer( props);
 
    for( int i=0 ; i<nodes.length ; i++) {
      System.out.println( "######################## Va uno " + i);
View Full Code Here

     
      // create an instance of HtmlCleaner
    HtmlCleaner cleaner = new HtmlCleaner();

    // take default cleaner properties
    CleanerProperties props = cleaner.getProperties();

    // customize cleaner's behaviour with property setters
//    props.setXXX(...);

    // Clean HTML taken from simple string, file, URL, input stream,
View Full Code Here

     
      // create an instance of HtmlCleaner
    HtmlCleaner cleaner = new HtmlCleaner();

    // take default cleaner properties
    CleanerProperties props = cleaner.getProperties();

    // customize cleaner's behaviour with property setters
//    props.setXXX(...);

    // Clean HTML taken from simple string, file, URL, input stream,
View Full Code Here

    {
        // 1. get ally
      String page = HttpServer.getHttpServer().httpGetPage( "http://s3.travian.net/allianz.php?aid=" + ally.getId());
       
        HtmlCleaner cleaner = new HtmlCleaner();
        CleanerProperties props = cleaner.getProperties();
        props.setRecognizeUnicodeChars( true);
//        TagNode node = cleaner.clean( new File("tests/ally.html"));
        TagNode node = cleaner.clean( page);

        updatePlayers( ally, node);
      
View Full Code Here

        // 1. get overview/innerview of the current screen
      String page = HttpServer.getHttpServer().httpGetPage( "http://s3.travian.net/spieler.php?uid=" + player.getId());
      Thread.sleep( (long) (1000 + 3000*Math.random()));

        HtmlCleaner cleaner = new HtmlCleaner();
        CleanerProperties props = cleaner.getProperties();
        props.setRecognizeUnicodeChars( true);
//        TagNode node = cleaner.clean( new File("tests/perfil.html"));
        TagNode node = cleaner.clean( page);

        updateMapVillages2( player, node);

View Full Code Here

  {
    // 1. get overview/innerview of the current screen
//    String page = HttpServer.getHttpServer().httpGetPage( "http://s3.travian.net/dorf1.php");
     
    HtmlCleaner cleaner = new HtmlCleaner();
    CleanerProperties props = cleaner.getProperties();
    props.setRecognizeUnicodeChars( true);
        TagNode node = cleaner.clean( new File("tests/overview8.html"));
//        TagNode node = cleaner.clean( page);

        updateVillages2( villages, node);
View Full Code Here

TOP

Related Classes of org.htmlcleaner.CleanerProperties

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle Inc. Contact coftware#gmail.com.