Package org.htmlparser.tags

Examples of org.htmlparser.tags.LinkTag


            "<A HREF=\"mailto:this@is.real\">this@is.real</A>",
            "http://www.cj.com/");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];
        assertEquals(
            "Link Plain Text",
            "this@is.real",
            linkTag.toPlainTextString());
        assertTrue("Link is a mail link", linkTag.isMailLink());
    }
View Full Code Here


            "<A HREF=\"javascript:alert('hello');\">say hello</A>",
            "http://www.cj.com/");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];

        assertEquals(
            "Link Plain Text",
            "say hello",
            linkTag.toPlainTextString());
        assertTrue("Link is a Javascript command", linkTag.isJavascriptLink());
    }
View Full Code Here

            "<A HREF=\"javascript_not.html\">say hello</A>",
            "http://www.cj.com/");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];

        assertEquals(
            "Link Plain Text",
            "say hello",
            linkTag.toPlainTextString());
        assertTrue(
            "Link is not a Javascript command",
            !linkTag.isJavascriptLink());
    }
View Full Code Here

            "<A HREF=\"ftp://some.where.it\">my ftp</A>",
            "http://www.cj.com/");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];

        assertEquals("Link Plain Text", "my ftp", linkTag.toPlainTextString());
        assertTrue("Link is a FTP site", linkTag.isFTPLink());
    }
View Full Code Here

    {
        createParser("<A HREF=\"ftp.html\">my ftp</A>", "http://www.cj.com/");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];

        assertEquals("Link Plain Text", "my ftp", linkTag.toPlainTextString());
        assertTrue("Link is not a FTP site", !linkTag.isFTPLink());
    }
View Full Code Here

            "<A HREF=\"newpage.html\">New Page</A>",
            "http://www.mysite.com/books/some.asp");
        parser.addScanner(new LinkScanner("-l"));
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];
        assertEquals(
            "Link",
            "http://www.mysite.com/books/newpage.html",
            linkTag.getLink());
    }
View Full Code Here

            "<a href=\"registration.asp?EventID=1272\"><img border=\"0\" src=\"\\images\\register.gif\"</a>",
            "http://www.fedpage.com/Event.asp?EventID=1272");
        parser.registerScanners();
        parseAndAssertNodeCount(1);
        assertTrue("Node should be a HTMLLinkTag", node[0] instanceof LinkTag);
        LinkTag linkTag = (LinkTag) node[0];
        // Get the image tag from the link

        Node insideNodes[] = new Node[10];
        int j = 0;
        for (SimpleNodeIterator e = linkTag.children(); e.hasMoreNodes();)
        {
            insideNodes[j++] = (Node) e.nextNode();
        }
        assertEquals("Number of contained internal nodes", 1, j);
        assertTrue(insideNodes[0] instanceof ImageTag);
View Full Code Here

            "<a class=rlbA href=/news/866201.asp?0sl=-"
                + "32>Shoe bomber handed life sentence</a>");
        parser.registerScanners();
        parseAndAssertNodeCount(1);
        assertType("node type", LinkTag.class, node[0]);
        LinkTag linkTag = (LinkTag) node[0];
        assertStringEquals(
            "link text",
            "Shoe bomber handed life sentence",
            linkTag.getLinkText());
        assertStringEquals(
            "link url",
            "/news/866201.asp?0sl=-32",
            linkTag.getLink());
    }
View Full Code Here

            "<a href=\"<%=Application(\"sURL\")% "
                + ">/literature/index.htm\">Literature</a>");
        parser.registerScanners();
        parseAndAssertNodeCount(1);
        assertType("should be link tag", LinkTag.class, node[0]);
        LinkTag linkTag = (LinkTag) node[0];
        assertStringEquals(
            "expected link",
            "<%=Application(\"sURL\")%>/literature/index.htm",
            linkTag.getLink());
    }
View Full Code Here

    protected URL[] extractLinks(String url) throws ParserException
    {
        Parser parser;
        Vector vector;
        Node node;
        LinkTag link;
        URL[] ret;

        parser = new Parser(url);
        parser.registerScanners();
        ObjectFindingVisitor visitor = new ObjectFindingVisitor(LinkTag.class);
        parser.visitAllNodesWith(visitor);
        Node[] nodes = visitor.getTags();
        vector = new Vector();
        for (int i = 0; i < nodes.length; i++)
            try
            {
                link = (LinkTag) nodes[i];
                vector.add(new URL(link.getLink()));
            }
            catch (MalformedURLException murle)
            {
                //vector.remove (i);
                //i--;
View Full Code Here

TOP

Related Classes of org.htmlparser.tags.LinkTag

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and owned by ORACLE Inc. Contact coftware#gmail.com.