Package com.alee.utils

Source Code of com.alee.utils.HtmlUtils

/*
* This file is part of WebLookAndFeel library.
*
* WebLookAndFeel library is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* WebLookAndFeel library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with WebLookAndFeel library.  If not, see <http://www.gnu.org/licenses/>.
*/

package com.alee.utils;

import net.htmlparser.jericho.HTMLElementName;
import net.htmlparser.jericho.Renderer;
import net.htmlparser.jericho.Source;
import net.htmlparser.jericho.Tag;

/**
* This class provides a set of utilities to work with HTML.
*
* @author Mikle Garin
*/

public final class HtmlUtils
{
    public static final String DEFAULT_LINE_SEPARATOR = "\n";

    /**
     * Returns plain text extracted from the specified HTML.
     *
     * @param html HTML
     * @return plain text
     */
    public static String getPlainText ( final String html )
    {
        return getPlainText ( html, DEFAULT_LINE_SEPARATOR );
    }

    /**
     * Returns plain text extracted from the specified HTML.
     *
     * @param html          HTML
     * @param lineSeparator line separator
     * @return plain text
     */
    public static String getPlainText ( final String html, final String lineSeparator )
    {
        final Source source = new Source ( html );
        final Tag[] tags = source.fullSequentialParse ();
        if ( tags.length > 0 )
        {
            final Renderer renderer = source.getRenderer ();
            renderer.setIncludeHyperlinkURLs ( false );
            renderer.setIncludeAlternateText ( false );
            renderer.setDecorateFontStyles ( false );
            renderer.setMaxLineLength ( Integer.MAX_VALUE );
            renderer.setBlockIndentSize ( 4 );
            renderer.setConvertNonBreakingSpaces ( false );
            renderer.setNewLine ( lineSeparator );
            return renderer.toString ();
        }
        else
        {
            return html;
        }
    }

    /**
     * Returns HTML with specified text made bold.
     *
     * @param text text to process
     * @return HTML with specified text made bold
     */
    public static String bold ( final String text )
    {
        return "<html><b>" + text + "</b></html>";
    }

    /**
     * Returns whether the specified text contains HTML tags or not.
     *
     * @param text text to process
     * @return true if the specified text contains HTML tags, false otherwise
     */
    public static boolean hasTags ( final String text )
    {
        return text != null && text.trim ().length () > 0 && new Source ( text ).fullSequentialParse ().length > 0;
    }

    /**
     * Returns whether specified text contains HTML tag or not.
     *
     * @param text text to process
     * @return true if specified text contains HTML tag, false otherwise
     */
    public static boolean hasHtml ( final String text )
    {
        return hasTag ( text, HTMLElementName.HTML );
    }

    /**
     * Returns whether text contains the specified tag or not.
     *
     * @param text text to process
     * @param tag  tag to find
     * @return true if text contains the specified tag, false otherwise
     */
    public static boolean hasTag ( final String text, final String tag )
    {
        if ( text != null && text.trim ().length () > 0 )
        {
            final Source source = new Source ( text );
            source.fullSequentialParse ();
            return source.getFirstElement ( tag ) != null;
        }
        else
        {
            return false;
        }
    }

    /**
     * Returns HTML content between body or html tags.
     *
     * @param text text to process
     * @return HTML content between body or html tags
     */
    public static String getContent ( final String text )
    {
        final String lowerCaseText = text.toLowerCase ();

        final String bodyTag = "<body>";
        final int body = lowerCaseText.indexOf ( bodyTag );
        final int bodyEnd = lowerCaseText.indexOf ( "</body>" );
        if ( body != -1 && bodyEnd != -1 )
        {
            return text.substring ( body + bodyTag.length (), bodyEnd );
        }

        final String htmlTag = "<html>";
        final int html = lowerCaseText.indexOf ( bodyTag );
        final int htmlEnd = lowerCaseText.indexOf ( "</html>" );
        if ( html != -1 && htmlEnd != -1 )
        {
            return text.substring ( html + htmlTag.length (), htmlEnd );
        }

        return text;
    }

    /**
     * Returns text converted into multiline HTML.
     *
     * @param text      text to convert
     * @param lineBreak line break text
     * @return text converted into multiline HTML
     */
    public static String convertToMultilineHtml ( final String text, final String... lineBreak )
    {
        String body = text;
        for ( final String divider : lineBreak )
        {
            body = body.replaceAll ( divider, "<br>" );
        }
        return "<html>" + body + "</html>";
    }
}
TOP

Related Classes of com.alee.utils.HtmlUtils

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.