Package org.htmlparser.filters

Examples of org.htmlparser.filters.TagNameFilter


      tag = conf.get("Cloud9.TargetTag");

      if (tag.equalsIgnoreCase("heading")) {
        filter = new HeadingTagFilter();
      } else {
        filter = new TagNameFilter(tag);
      }
    }
View Full Code Here


                        break;
                    case NAME:
                        if ("*".equals (token))
                            ret = new YesFilter ();
                        else if (ret == null)
                            ret = new TagNameFilter (unescape (token));
                        else
                            ret = new AndFilter (ret, new TagNameFilter (
                                unescape (token)));
                        nextToken ();
                        break;
                    case DELIM:
                        switch (token.charAt (0))
View Full Code Here

     
      par.reset();
      _links.clear();
     
      NodeFilter filter = new OrFilter( new NodeFilter[] {
          new TagNameFilter("A"),
          new TagNameFilter("META")
          }
      );
      NodeList list = par.parse( filter );
      System.out.println("Url: " + _url.toString() + " found " + list.size() + " items.");
      LinkTag lt = null;
View Full Code Here

      // *****************************************
      // Iterate images from HTML and replace CIDs

      NodeList oCollectionList = new NodeList();
      TagNameFilter oImgFilter = new TagNameFilter ("IMG");
      for (NodeIterator e = oPrsr.elements(); e.hasMoreNodes();)
        e.nextNode().collectInto(oCollectionList, oImgFilter);

      final int nImgs = oCollectionList.size();

View Full Code Here

            worker.setCaptureResources ((Boolean.valueOf (args[2]).booleanValue ()));
        worker.setFilter (
            new NotFilter (
                new OrFilter (
                    new AndFilter (
                        new TagNameFilter ("DIV"),
                        new HasAttributeFilter ("id", "navbar")),
                    new OrFilter (
                        new AndFilter (
                            new TagNameFilter ("DIV"),
                            new HasAttributeFilter ("id", "actionbar")),
                        new AndFilter (
                            new TagNameFilter ("DIV"),
                            new HasAttributeFilter ("id", "xhtml-validator"))))));
        worker.capture ();
       
        System.exit (0);
    }
View Full Code Here

        "<td><a href=\"nishi-hongwanji-lodging.html\"><img height=99 width=124 src=\"nishi-hongwanji-lodging-thumb.jpg\" border=0 ></a></td>\n"+
        "</tr></table></div>\n"+
        "</body>\n"+
        "</html>");
        NodeList collectionList = new NodeList();
        TagNameFilter filter = new TagNameFilter ("IMG");
        for (NodeIterator e = parser.elements();e.hasMoreNodes();)
            e.nextNode().collectInto(collectionList,filter);
        assertEquals("Size of collection vector should be 5",5,collectionList.size());
        // All items in collection vector should be links
        for (SimpleNodeIterator e = collectionList.elements();e.hasMoreNodes();) {
View Full Code Here

    /**
     * Create a wrapper over a new TagNameFilter.
     */
    public TagNameFilterWrapper ()
    {
        mFilter = new TagNameFilter ();

        // add the tag name choice
        mName = new JComboBox ();
        mName.setEditable (true);
        add (mName);
View Full Code Here

     * Get the underlying node filter object.
     * @return The node filter object suitable for serialization.
     */
    public NodeFilter getNodeFilter ()
    {
        TagNameFilter ret;
       
        ret = new TagNameFilter ();
        ret.setName (mFilter.getName ());
           
        return (ret);
    }
View Full Code Here

        else
            try
            {
                parser = new Parser ();
                if (1 < args.length)
                    filter = new TagNameFilter (args[1]);
                else
                {
                    filter = null;
                    // for a simple dump, use more verbose settings
                    parser.setFeedback (Parser.STDOUT);
View Full Code Here

    private static NodeList getLinks (String output, String tag, boolean recursive)
        throws ParserException, UnsupportedEncodingException
    {
       
        Parser parser = new Parser();
        NodeFilter filterLink = new TagNameFilter (tag);
        NodeList links = new NodeList ();
        parser = createParserParsingAnInputString(output);
        links = parser.extractAllNodesThatMatch(filterLink);

        // loop to remove tags added recursively
View Full Code Here

TOP

Related Classes of org.htmlparser.filters.TagNameFilter

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.