Package org.pdf4j.saxon.event

Source Code of org.pdf4j.saxon.event.XHTMLURIEscaper

package org.pdf4j.saxon.event;

import org.pdf4j.saxon.codenorm.Normalizer;
import org.pdf4j.saxon.om.NamePool;
import org.pdf4j.saxon.om.NamespaceConstant;
import org.pdf4j.saxon.trans.XPathException;

import java.util.HashSet;


/**
* This class performs URI escaping for the XHTML output method. The logic for performing escaping
* is the same as the HTML output method, but the way in which attributes are identified for escaping
* is different, because XHTML is case-sensitive.
*/

public class XHTMLURIEscaper extends HTMLURIEscaper {

    /**
    * Table of attributes whose value is a URL
    */

    private HashSet urlTable;

    private synchronized void buildURIAttributeTable() {
        // Reuse the attribute table for all XHTMLEmitters sharing the same namepool
        NamePool pool = getPipelineConfiguration().getConfiguration().getNamePool();
        urlTable = (HashSet)pool.getClientData(this.getClass());
        if (urlTable == null) {
            urlTable = new HashSet(40);
            pool.setClientData(this.getClass(), urlTable);
        }
        setUrlAttribute(pool, "form", "action");
        setUrlAttribute(pool, "object", "archive");
        setUrlAttribute(pool, "body", "background");
        setUrlAttribute(pool, "q", "cite");
        setUrlAttribute(pool, "blockquote", "cite");
        setUrlAttribute(pool, "del", "cite");
        setUrlAttribute(pool, "ins", "cite");
        setUrlAttribute(pool, "object", "classid");
        setUrlAttribute(pool, "object", "codebase");
        setUrlAttribute(pool, "applet", "codebase");
        setUrlAttribute(pool, "object", "data");
        setUrlAttribute(pool, "button", "datasrc");
        setUrlAttribute(pool, "div", "datasrc");
        setUrlAttribute(pool, "input", "datasrc");
        setUrlAttribute(pool, "object", "datasrc");
        setUrlAttribute(pool, "select", "datasrc");
        setUrlAttribute(pool, "span", "datasrc");
        setUrlAttribute(pool, "table", "datasrc");
        setUrlAttribute(pool, "textarea", "datasrc");
        setUrlAttribute(pool, "script", "for");
        setUrlAttribute(pool, "a", "href");
        setUrlAttribute(pool, "a", "name");       // see second note in section B.2.1 of HTML 4 specification
        setUrlAttribute(pool, "area", "href");
        setUrlAttribute(pool, "link", "href");
        setUrlAttribute(pool, "base", "href");
        setUrlAttribute(pool, "img", "longdesc");
        setUrlAttribute(pool, "frame", "longdesc");
        setUrlAttribute(pool, "iframe", "longdesc");
        setUrlAttribute(pool, "head", "profile");
        setUrlAttribute(pool, "script", "src");
        setUrlAttribute(pool, "input", "src");
        setUrlAttribute(pool, "frame", "src");
        setUrlAttribute(pool, "iframe", "src");
        setUrlAttribute(pool, "img", "src");
        setUrlAttribute(pool, "img", "usemap");
        setUrlAttribute(pool, "input", "usemap");
        setUrlAttribute(pool, "object", "usemap");
    }

    private void setUrlAttribute(NamePool pool, String element, String attribute) {
        int elcode = pool.allocate("", NamespaceConstant.XHTML, element) & NamePool.FP_MASK;
        int atcode = pool.allocate("", "", attribute) & NamePool.FP_MASK;
        Long key = new Long(((long)elcode)<<32 | (long)atcode);
        urlTable.add(key);
    }

    /**
     * Determine whether a given attribute is a URL attribute
     */

    private boolean isURLAttribute(int elcode, int atcode) {
        elcode = elcode & NamePool.FP_MASK;
        atcode = atcode & NamePool.FP_MASK;
        Long key = new Long(((long)elcode)<<32 | (long)atcode);
        return urlTable.contains(key);
    }

    /**
     * Do the real work of starting the document. This happens when the first
     * content is written.
     *
     * @throws org.pdf4j.saxon.trans.XPathException
     *
     */

    public void open() throws XPathException {
        super.open();
        if (escapeURIAttributes) {
            buildURIAttributeTable();
        }
    }

    /**
     * Notify an attribute. Attributes are notified after the startElement event, and before any
     * children. Namespaces and attributes may be intermingled.
     *
     * @param nameCode   The name of the attribute, as held in the name pool
     * @param typeCode   The type of the attribute, as held in the name pool
     * @param properties Bit significant value. The following bits are defined:
     *                   <dd>DISABLE_ESCAPING</dd>    <dt>Disable escaping for this attribute</dt>
     *                   <dd>NO_SPECIAL_CHARACTERS</dd>      <dt>Attribute value contains no special characters</dt>
     * @throws IllegalStateException: attempt to output an attribute when there is no open element
     *                                start tag
     */

    public void attribute(int nameCode, int typeCode, CharSequence value, int locationId, int properties) throws XPathException {
        if (escapeURIAttributes &&
                isURLAttribute(currentElement, nameCode) &&
                (properties & ReceiverOptions.DISABLE_ESCAPING) == 0) {
            CharSequence normalized = new Normalizer(Normalizer.C).normalize(value);
            getUnderlyingReceiver().attribute(
                    nameCode, typeCode, HTMLURIEscaper.escapeURL(normalized, true), locationId,
                    properties | ReceiverOptions.DISABLE_CHARACTER_MAPS);
        } else {
            getUnderlyingReceiver().attribute(
                    nameCode, typeCode, value, locationId, properties);
        }
    }

}

//
// The contents of this file are subject to the Mozilla Public License Version 1.0 (the "License");
// you may not use this file except in compliance with the License. You may obtain a copy of the
// License at http://www.mozilla.org/MPL/
//
// Software distributed under the License is distributed on an "AS IS" basis,
// WITHOUT WARRANTY OF ANY KIND, either express or implied.
// See the License for the specific language governing rights and limitations under the License.
//
// The Original Code is: all this file.
//
// The Initial Developer of the Original Code is Michael H. Kay.
//
// Portions created by (your name) are Copyright (C) (your legal entity). All Rights Reserved.
//
// Contributor(s): none.
//
TOP

Related Classes of org.pdf4j.saxon.event.XHTMLURIEscaper

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.