Package org.htmlparser.scanners

Examples of org.htmlparser.scanners.LinkScanner


  public void testBrokenLink() throws ParserException {
    createParser("<a href=\"faq.html\">" + "<br>\n" + "<img src=\"images/46revues.gif\" " + "width=\"100\" "
        + "height=\"46\" " + "border=\"0\" " + "alt=\"Rejoignez revues.org!\" " + "align=\"middle\">",
        "http://www.yahoo.com");
    // Register the link scanner
    parser.addScanner(new LinkScanner("-l"));

    parseAndAssertNodeCount(1);
    assertTrue("Node 0 should be a link tag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];
    assertNotNull(linkTag.toString());
View Full Code Here


  public void testLinkDataContents() throws ParserException {
    createParser(
        "<a href=\"http://transfer.go.com/cgi/atransfer.pl?goto=http://www.signs.movies.com&name=114332&srvc=nws&context=283&guid=4AD5723D-C802-4310-A388-0B24E1A79689\" target=\"_new\"><img src=\"http://ad.abcnews.com/ad/sponsors/buena_vista_pictures/bvpi-ban0003.gif\" width=468 height=60 border=\"0\" alt=\"See Signs in Theaters 8-2 - Starring Mel Gibson\" align=><font face=\"verdana,arial,helvetica\" SIZE=\"1\"><b></b></font></a>",
        "http://transfer.go.com");
    // Register the link scanner and the image scanner it creates
    LinkScanner linkScanner = new LinkScanner("-l");
    parser.addScanner(linkScanner);
    parser.addScanner(linkScanner.createImageScanner("-i"));

    parseAndAssertNodeCount(1);
    assertTrue("Node 0 should be a link tag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];
    assertEquals(
View Full Code Here

  }

  public void testNotMailtoLink() throws ParserException {
    createParser("<A HREF=\"mailto.html\">not@for.real</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];

    assertEquals("Link Plain Text", "not@for.real", linkTag.toPlainTextString());
View Full Code Here

    assertTrue("Link is not a mail link", !linkTag.isMailLink());
  }

  public void testMailtoLink() throws ParserException {
    createParser("<A HREF=\"mailto:this@is.real\">this@is.real</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];
    assertEquals("Link Plain Text", "this@is.real", linkTag.toPlainTextString());
    assertTrue("Link is a mail link", linkTag.isMailLink());
View Full Code Here

    assertTrue("Link is a mail link", linkTag.isMailLink());
  }

  public void testJavascriptLink() throws ParserException {
    createParser("<A HREF=\"javascript:alert('hello');\">say hello</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];

    assertEquals("Link Plain Text", "say hello", linkTag.toPlainTextString());
View Full Code Here

    assertTrue("Link is a Javascript command", linkTag.isJavascriptLink());
  }

  public void testNotJavascriptLink() throws ParserException {
    createParser("<A HREF=\"javascript_not.html\">say hello</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];

    assertEquals("Link Plain Text", "say hello", linkTag.toPlainTextString());
View Full Code Here

    assertTrue("Link is not a Javascript command", !linkTag.isJavascriptLink());
  }

  public void testFTPLink() throws ParserException {
    createParser("<A HREF=\"ftp://some.where.it\">my ftp</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];

    assertEquals("Link Plain Text", "my ftp", linkTag.toPlainTextString());
View Full Code Here

    assertTrue("Link is a FTP site", linkTag.isFTPLink());
  }

  public void testNotFTPLink() throws ParserException {
    createParser("<A HREF=\"ftp.html\">my ftp</A>", "http://www.cj.com/");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];

    assertEquals("Link Plain Text", "my ftp", linkTag.toPlainTextString());
View Full Code Here

    assertTrue("Link is not a FTP site", !linkTag.isFTPLink());
  }

  public void testRelativeLinkNotHTMLBug() throws ParserException {
    createParser("<A HREF=\"newpage.html\">New Page</A>", "http://www.mysite.com/books/some.asp");
    parser.addScanner(new LinkScanner("-l"));
    parseAndAssertNodeCount(1);
    assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
    LinkTag linkTag = (LinkTag) node[0];
    assertEquals("Link", "http://www.mysite.com/books/newpage.html", linkTag.getLink());
  }
View Full Code Here

    LinkTag linkTag = (LinkTag) node[0];
    assertStringEquals("expected link", "<%=Application(\"sURL\")%>/literature/index.htm", linkTag.getLink());
  }

  public void testLinkScannerFilter() throws Exception {
    LinkScanner linkScanner = new LinkScanner(LinkTag.LINK_TAG_FILTER);
    assertEquals("linkscanner filter", LinkTag.LINK_TAG_FILTER, linkScanner.getFilter());
  }
View Full Code Here

TOP

Related Classes of org.htmlparser.scanners.LinkScanner

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.