Package org.pdf4j.saxon

Source Code of org.pdf4j.saxon.Transform

package org.pdf4j.saxon;

import org.pdf4j.saxon.event.Builder;
import org.pdf4j.saxon.event.Receiver;
import org.pdf4j.saxon.event.SaxonOutputKeys;
import org.pdf4j.saxon.instruct.TerminationException;
import org.pdf4j.saxon.om.Validation;
import org.pdf4j.saxon.trace.ExpressionPresenter;
import org.pdf4j.saxon.trace.TraceListener;
import org.pdf4j.saxon.trans.XPathException;
import org.pdf4j.saxon.value.UntypedAtomicValue;
import org.xml.sax.InputSource;
import org.xml.sax.XMLReader;

import javax.xml.transform.*;
import javax.xml.transform.sax.SAXSource;
import javax.xml.transform.stream.StreamResult;
import javax.xml.transform.stream.StreamSource;

import java.io.File;
import java.io.FileOutputStream;
import java.io.OutputStream;
import java.io.PrintStream;
import java.net.URI;
import java.net.URISyntaxException;
import java.util.ArrayList;
import java.util.Date;
import java.util.List;
import java.util.Properties;

/**
* This <B>Transform</B> class is the entry point to the Saxon XSLT Processor. This
* class is provided to control the processor from the command line.<p>
* <p/>
* The XSLT syntax supported conforms to the W3C XSLT 1.0 and XPath 1.0 recommendation.
* Only the transformation language is implemented (not the formatting objects).
* Saxon extensions are documented in the file extensions.html
*
* @author Michael H. Kay
*/

public class Transform {

    protected TransformerFactoryImpl factory;
    protected Configuration config;
    protected boolean useURLs = false;
    protected boolean showTime = false;
    protected int repeat = 1;
    String sourceParserName = null;

    /**
     * Main program, can be used directly from the command line.
     * <p>The format is:</P>
     * <p>java org.orbeon.saxon.Transform [options] <I>source-file</I> <I>style-file</I> &gt;<I>output-file</I></P>
     * <p>followed by any number of parameters in the form {keyword=value}... which can be
     * referenced from within the stylesheet.</p>
     * <p>This program applies the XSL style sheet in style-file to the source XML document in source-file.</p>
     *
     * @param args List of arguments supplied on operating system command line
     * @throws java.lang.Exception Indicates that a compile-time or
     *                             run-time error occurred
     */

    public static void main(String args[])
            throws java.lang.Exception {
        // the real work is delegated to another routine so that it can be used in a subclass
        (new Transform()).doTransform(args, "java org.orbeon.saxon.Transform");
    }

    /**
     * Set the configuration in the TransformerFactory. This is designed to be
     * overridden in a subclass
     * @param schemaAware True if the transformation is to be schema-aware
     * @param className Name of the schema-aware Configuration class to be loaded. Designed for use by .NET;
     * can normally be null.
     */

    public void setFactoryConfiguration(boolean schemaAware, String className) throws RuntimeException {
        if (schemaAware) {
            config = Configuration.makeSchemaAwareConfiguration(null, className);
        } else {
            config = new Configuration();
            // In basic XSLT, all nodes are untyped when calling from the command line
            config.setAllNodesUntyped(true);
        }
        factory = new TransformerFactoryImpl(config);
    }

    /**
     * Support method for main program. This support method can also be invoked from subclasses
     * that support the same command line interface
     *
     * @param args the command-line arguments
     * @param command the form of the command as written by the user, to be used in error messages
     */

    public void doTransform(String args[], String command) {


        String sourceFileName = null;
        String styleFileName = null;
        File outputFile = null;
        ArrayList parameterList = new ArrayList(20);
        String outputFileName = null;
        String initialMode = null;
        String initialTemplate = null;
        boolean useAssociatedStylesheet = false;
        boolean wholeDirectory = false;
        boolean precompiled = false;
        boolean dtdValidation = false;
        String styleParserName = null;
        boolean explain = false;
        String explainOutputFileName = null;
        String additionalSchemas = null;
        PrintStream traceDestination = System.err;
        boolean closeTraceDestination = false;

        boolean schemaAware = false;
        for (int i=0; i<args.length; i++) {
            if (args[i].equals("-sa") ||
                    args[i].startsWith("-sa:") ||
                    args[i].startsWith("-val:") ||
                    args[i].equals("-val") ||
                    args[i].equals("-vlax") ||
                    args[i].startsWith("-xsd:") ||
                    args[i].startsWith("-xsdversion:") ||
                    args[i].equals("-p")) {
                schemaAware = true;
                break;
            }
        }

        try {
            setFactoryConfiguration(schemaAware, null);
        } catch (Exception err) {
            err.printStackTrace();
            quit(err.getMessage(), 2);
        }
        config = factory.getConfiguration();
        config.setVersionWarning(true)// unless suppressed by command line options
        schemaAware = config.isSchemaAware(Configuration.XSLT);

        // Check the command-line arguments.

        try {
            int i = 0;
            while (true) {
                if (i >= args.length) {
                    break;
                }

                if (args[i].charAt(0) == '-') {
                    String option;
                    String value = null;
                    int colon = args[i].indexOf(':');
                    if (colon > 0 && colon < args[i].length() - 1) {
                        option = args[i].substring(1, colon);
                        value = args[i].substring(colon+1);
                    } else {
                        option = args[i].substring(1);
                    }
                    if (option.equals("a")) {
                        useAssociatedStylesheet = true;
                        i++;
                    } else if (option.equals("c")) {
                        precompiled = true;
                        if (value != null) {
                            styleFileName = value;
                        }
                        i++;
                    } else if (option.equals("cr")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No resolver after -cr");
                            }
                            value = args[i++];
                        }
                        Object resolver = config.getInstance(value, null);
                        factory.setAttribute(FeatureKeys.COLLECTION_URI_RESOLVER, resolver);
                    } else if (option.equals("ds")) {
                        factory.setAttribute(FeatureKeys.TREE_MODEL,
                                new Integer(Builder.LINKED_TREE));
                        i++;
                    } else if (option.equals("dt")) {
                        factory.setAttribute(FeatureKeys.TREE_MODEL,
                                new Integer(Builder.TINY_TREE));
                        i++;
                    } else if (option.equals("dtd")) {
                        if (!("on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-dtd option must be -dtd:on or -dtd:off");
                        }
                        factory.setAttribute(FeatureKeys.DTD_VALIDATION,
                                    Boolean.valueOf("on".equals(value)));
                        i++;
                    } else if (option.equals("expand")) {
                        if (!("on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-expand option must be 'on' or 'off'");
                        }
                        factory.setAttribute(FeatureKeys.EXPAND_ATTRIBUTE_DEFAULTS,
                                    Boolean.valueOf("on".equals(value)));
                        i++;                       
                    } else if (option.equals("explain")) {
                        explain = true;
                        explainOutputFileName = value; // may be omitted/null
                        factory.setAttribute(FeatureKeys.TRACE_OPTIMIZER_DECISIONS, Boolean.TRUE);
                        i++;
                    } else if (option.equals("ext")) {
                        if (!("on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-ext option must be -ext:on or -ext:off");
                        }
                        factory.setAttribute(FeatureKeys.ALLOW_EXTERNAL_FUNCTIONS,
                                    Boolean.valueOf("on".equals(value)));
                        i++;
                    } else if (option.equals("im")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No initial mode after -im");
                            }
                            value = args[i++];
                        }
                        initialMode = value;
                    } else if (option.equals("it")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No initial template after -it");
                            }
                            value = args[i++];
                        }
                        initialTemplate = value;
                    } else if (option.equals("l")) {
                        if (!(value==null || "on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-l option must be -l:on or -l:off");
                        }
                        factory.setAttribute(FeatureKeys.LINE_NUMBERING,
                                Boolean.valueOf(!"off".equals(value)));
                        i++;
                    } else if (option.equals("m")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No message receiver class after -m");
                            }
                            value = args[i++];
                        }
                        factory.setAttribute(FeatureKeys.MESSAGE_EMITTER_CLASS, value);
                    } else if (option.equals("noext")) {
                        i++;
                        factory.setAttribute(FeatureKeys.ALLOW_EXTERNAL_FUNCTIONS,
                                Boolean.valueOf(false));
                    } else if (option.equals("novw")) {
                        factory.setAttribute(FeatureKeys.VERSION_WARNING,
                                Boolean.valueOf(false));
                        i++;
                    } else if (option.equals("o")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No output file name after -o");
                            }
                            value = args[i++];
                        }
                        outputFileName = value;

                    } else if (option.equals("or")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No output resolver class after -or");
                            }
                            value = args[i++];
                        }
                        String orclass = value;
                        Object resolver = config.getInstance(orclass, null);
                        factory.setAttribute(FeatureKeys.OUTPUT_URI_RESOLVER, resolver);

                    } else if (option.equals("outval")) {
                        if (schemaAware) {
                            if (!(value==null || "recover".equals(value) || "fatal".equals(value))) {
                                badUsage(command, "-outval option must be 'recover' or 'fatal'");
                            }
                            factory.setAttribute(FeatureKeys.VALIDATION_WARNINGS,
                                    Boolean.valueOf("recover".equals(value)));
                        } else {
                            quit("The -outval option requires a schema-aware processor", 2);
                        }
                        i++;
                    } else if (option.equals("p")) {
                        i++;
                        if (!(value==null || "on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-p option must be -p:on or -p:off");
                        }
                        if (!"off".equals(value)) {
                            //setPOption(config);
                            config.setParameterizedURIResolver();
                            useURLs = true;
                        }
                    } else if (option.equals("r")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No URIesolver class after -r");
                            }
                            value = args[i++];
                        }
                        factory.setURIResolver(config.makeURIResolver(value));
                    } else if (option.equals("repeat")) {
                        i++;
                        if (value == null) {
                            badUsage(command, "No number after -repeat");
                        } else {
                            try {
                                repeat = Integer.parseInt(value);
                            } catch (NumberFormatException err) {
                                badUsage(command, "Bad number after -repeat");
                            }
                        }
                    } else if (option.equals("s")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No source file name after -s");
                            }
                            value = args[i++];
                        }
                        sourceFileName = value;
                    } else if (option.equals("sa")) {
                        // already handled
                        i++;
                    } else if (option.equals("snone")) {
                        factory.setAttribute(FeatureKeys.STRIP_WHITESPACE, "none");
                        i++;
                    } else if (option.equals("sall")) {
                        factory.setAttribute(FeatureKeys.STRIP_WHITESPACE, "all");
                        i++;
                    } else if (option.equals("signorable")) {
                        factory.setAttribute(FeatureKeys.STRIP_WHITESPACE, "ignorable");
                        i++;
                    } else if (option.equals("strip")) {
                        if ("none".equals(value) || "all".equals(value) || "ignorable".equals(value)) {
                            factory.setAttribute(FeatureKeys.STRIP_WHITESPACE, value);
                            i++;
                        } else {
                            badUsage(command, "-strip must be none, all, or ignorable");
                        }
                    } else if (option.equals("t")) {
                        if (!showTime) {
                            // don't do it twice if the option appears twice
                            System.err.println(config.getProductTitle());
                            System.err.println(Configuration.getPlatform().getPlatformVersion());
                            factory.setAttribute(FeatureKeys.TIMING, Boolean.valueOf(true));
                            showTime = true;
                        }
                        i++;
                    } else if (option.equals("T")) {
                        i++;
                        TraceListener traceListener;
                        if (value == null) {
                            traceListener = new org.pdf4j.saxon.trace.XSLTTraceListener();
                        } else {
                            traceListener = config.makeTraceListener(value);
                        }
                        factory.setAttribute(FeatureKeys.TRACE_LISTENER, traceListener);
                        factory.setAttribute(FeatureKeys.LINE_NUMBERING, Boolean.TRUE);

                    } else if (option.equals("TJ")) {
                        i++;
                        factory.setAttribute(FeatureKeys.TRACE_EXTERNAL_FUNCTIONS,
                                Boolean.TRUE);
                    } else if (option.equals("TL")) {
                        i++;
                        if (args.length < i + 2) {
                            badUsage(command, "No TraceListener class");
                        }
                        TraceListener traceListener = config.makeTraceListener(args[i++]);
                        factory.setAttribute(FeatureKeys.TRACE_LISTENER,
                                traceListener);
                        factory.setAttribute(FeatureKeys.LINE_NUMBERING,
                                Boolean.TRUE);
                    } else if (option.equals("TP")) {
                        i++;
                        TraceListener traceListener = new org.pdf4j.saxon.trace.TimedTraceListener();
                        factory.setAttribute(FeatureKeys.TRACE_LISTENER,
                                traceListener);
                        factory.setAttribute(FeatureKeys.LINE_NUMBERING,
                                Boolean.TRUE);
                    } else if (option.equals("traceout")) {
                        i++;
                        if (value.equals("#err")) {
                            // no action, this is the default
                        } else if (value.equals("#out")) {
                            traceDestination = System.out;
                        } else if (value.equals("#null")) {
                            traceDestination = null;
                        } else {
                            traceDestination = new PrintStream(new FileOutputStream(new File(value)));
                            closeTraceDestination = true;
                        }

                    } else if (option.equals("tree")) {
                        if ("linked".equals(value)) {
                            factory.setAttribute(FeatureKeys.TREE_MODEL,
                                    new Integer(Builder.LINKED_TREE));
                        } else if ("tiny".equals(value)) {
                            factory.setAttribute(FeatureKeys.TREE_MODEL,
                                new Integer(Builder.TINY_TREE));
                        } else {
                            badUsage(command, "-tree option must be 'linked' or 'tiny'");
                        }
                        i++;
                    } else if (option.equals("u")) {
                        useURLs = true;
                        i++;
                    } else if (option.equals("v")) {
                        factory.setAttribute(FeatureKeys.DTD_VALIDATION,
                                Boolean.valueOf(true));
                        dtdValidation = true;
                        i++;
                    } else if (option.equals("val")) {
                        if (!schemaAware) {
                            badUsage(command, "The -val option requires a schema-aware processor");
                        } else if (value==null || "strict".equals(value)) {
                                factory.setAttribute(FeatureKeys.SCHEMA_VALIDATION,
                                    new Integer(Validation.STRICT));
                        } else if ("lax".equals(value)) {
                            factory.setAttribute(FeatureKeys.SCHEMA_VALIDATION,
                                new Integer(Validation.LAX));
                        } else {
                            badUsage(command, "-val option must be 'strict' or 'lax'");
                        }
                        i++;
                    } else if (option.equals("vlax")) {
                        if (schemaAware) {
                            factory.setAttribute(FeatureKeys.SCHEMA_VALIDATION,
                                    new Integer(Validation.LAX));
                        } else {
                            quit("The -vlax option requires a schema-aware processor", 2);
                        }
                        i++;
                    } else if (option.equals("versionmsg")) {
                        if (!("on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-versionmsg option must be -versionmsg:on or -versionmsg:off");
                        }
                        factory.setAttribute(FeatureKeys.VERSION_WARNING,
                                    Boolean.valueOf("on".equals(value)));
                        i++;
                    } else if (option.equals("vw")) {
                        if (schemaAware) {
                            factory.setAttribute(FeatureKeys.VALIDATION_WARNINGS,
                                    Boolean.valueOf(true));
                        } else {
                            quit("The -vw option requires a schema-aware processor", 2);
                        }
                        i++;
                    } else if (option.equals("warnings")) {
                        if ("silent".equals(value)) {
                            factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.RECOVER_SILENTLY));
                        } else if ("recover".equals(value)) {
                            factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.RECOVER_WITH_WARNINGS));
                        } else if ("fatal".equals(value)) {
                            factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.DO_NOT_RECOVER));
                        }
                        i++;
                    } else if (option.equals("w0")) {
                        i++;
                        factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.RECOVER_SILENTLY));
                    } else if (option.equals("w1")) {
                        i++;
                        factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.RECOVER_WITH_WARNINGS));
                    } else if (option.equals("w2")) {
                        i++;
                        factory.setAttribute(FeatureKeys.RECOVERY_POLICY,
                                new Integer(Configuration.DO_NOT_RECOVER));

                    } else if (option.equals("x")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No source parser class after -x");
                            }
                            value = args[i++];
                        }
                        sourceParserName = value;
                        factory.setAttribute(FeatureKeys.SOURCE_PARSER_CLASS, sourceParserName);
                    } else if (option.equals("xi")) {
                        if (!(value==null || "on".equals(value) || "off".equals(value))) {
                            badUsage(command, "-xi option must be -xi:on or -xi:off");
                        }
                        if (!"off".equals(value)) {
                            factory.setAttribute(FeatureKeys.XINCLUDE, Boolean.TRUE);
                        }
                        i++;
                   } else if (option.equals("xmlversion")) {    // XML 1.1
                        i++;
                        if (!("1.0".equals(value) | "1.1".equals(value))) {
                            badUsage(command, "-xmlversion must be 1.0 or 1.1");
                        }
                        factory.setAttribute(FeatureKeys.XML_VERSION, value);
                    } else if (option.equals("xsd")) {
                        i++;
                        additionalSchemas = value;
                    } else if (option.equals("xsdversion")) {    // XSD 1.1
                        i++;
                        if (!("1.0".equals(value) | "1.1".equals(value))) {
                            badUsage(command, "-xsdversion must be 1.0 or 1.1");
                        }
                        config.setConfigurationProperty(FeatureKeys.XSD_VERSION, value);
                    } else if (option.equals("xsiloc")) {
                        i++;
                        if ("off".equals(value)) {
                            config.setConfigurationProperty(FeatureKeys.USE_XSI_SCHEMA_LOCATION, Boolean.FALSE);
                        } else if ("on".equals(value)) {
                            config.setConfigurationProperty(FeatureKeys.USE_XSI_SCHEMA_LOCATION, Boolean.TRUE);
                        } else {
                            badUsage(value, "format: -xsiloc:(on|off)");
                        }
                    } else if (option.equals("xsl")) {
                        i++;
                        styleFileName = value;
                    } else if (option.equals("y")) {
                        i++;
                        if (value == null) {
                            if (args.length < i + 2) {
                                badUsage(command, "No stylesheet parser class after -y");
                            }
                            value = args[i++];
                        }
                        styleParserName = value;
                        factory.setAttribute(FeatureKeys.STYLE_PARSER_CLASS, value);

                    } else if (option.equals("1.1")) {    // XML 1.1
                        i++;
                        factory.setAttribute(FeatureKeys.XML_VERSION, "1.1");

                    } else if (args[i].equals("-?")) {
                        badUsage(command, "");
                    } else if (args[i].equals("-")) {
                        break;
                        // this means take the source from standard input
                    } else {
                        badUsage(command, "Unknown option " + args[i]);
                    }
                } else {
                    break;
                }
            }

            if (initialTemplate != null && useAssociatedStylesheet) {
                badUsage(command, "-it and -a options cannot be used together");
            }

            if (initialTemplate == null && sourceFileName == null) {
                if (args.length < i + 1) {
                    badUsage(command, "No source file name");
                }
                sourceFileName = args[i++];
            }

            if (!useAssociatedStylesheet && styleFileName == null) {
                if (args.length < i + 1) {
                    badUsage(command, "No stylesheet file name");
                }
                styleFileName = args[i++];
            }

            for (int p = i; p < args.length; p++) {
                String arg = args[p];
                int eq = arg.indexOf("=");
                if (eq < 1 || eq >= arg.length()) {
                    badUsage(command, "Bad param=value pair on command line: " + arg);
                }
                parameterList.add(arg);
            }

            config.displayLicenseMessage();

            if (additionalSchemas != null) {
                Query.loadAdditionalSchemas(config, additionalSchemas);
            }

            List sources = null;
            if (sourceFileName != null) {
                boolean useSAXSource = sourceParserName != null || dtdValidation;
                Object loaded = loadDocuments(sourceFileName, useURLs, config, useSAXSource);
                if (loaded instanceof List) {
                    wholeDirectory = true;
                    sources = (List)loaded;
                } else {
                    wholeDirectory = false;
                    sources = new ArrayList(1);
                    sources.add(loaded);
                }
                sources = preprocess(sources);
                if (wholeDirectory) {
                    if (outputFileName == null) {
                        quit("To process a directory, -o must be specified", 2);
                    } else if (outputFileName.equals(sourceFileName)) {
                        quit("Output directory must be different from input", 2);
                    } else {
                        outputFile = new File(outputFileName);
                        if (!outputFile.isDirectory()) {
                            quit("Input is a directory, but output is not", 2);
                        }
                    }
                }
            }

            if (outputFileName != null && !wholeDirectory) {
                outputFile = new File(outputFileName);
                if (outputFile.isDirectory()) {
                    quit("Output is a directory, but input is not", 2);
                }
            }

            if (useAssociatedStylesheet) {
                if (wholeDirectory) {
                    processDirectoryAssoc(sources, outputFile, parameterList,
                            initialMode, traceDestination);
                } else {
                    processFileAssoc((Source)sources.get(0), null, outputFile, parameterList,
                            initialMode, traceDestination);
                }
            } else {

                long startTime = (new Date()).getTime();

                PreparedStylesheet sheet = null;

                if (precompiled) {
                    try {
                        sheet = PreparedStylesheet.loadCompiledStylesheet(config, styleFileName);
                        if (showTime) {
                            long endTime = (new Date()).getTime();
                            System.err.println("Stylesheet loading time: " + (endTime - startTime) + " milliseconds");
                        }
                    } catch (Exception err) {
                        err.printStackTrace();
                    }
                } else {
                    Source styleSource;
                    XMLReader styleParser = null;
                    if (useURLs || styleFileName.startsWith("http:")
                            || styleFileName.startsWith("file:")) {
                        styleSource = config.getURIResolver().resolve(styleFileName, null);
                        if (styleSource == null) {
                            styleSource = config.getSystemURIResolver().resolve(styleFileName, null);
                        }
                    } else if (styleFileName.equals("-")) {
                        // take input from stdin
                        if (styleParserName == null) {
                            styleSource = new StreamSource(System.in);
                        } else if (Configuration.getPlatform().isJava()) {
                            styleParser = config.getStyleParser();
                            styleSource = new SAXSource(styleParser, new InputSource(System.in));
                        } else {
                            styleSource = new StreamSource(System.in);
                        }
                    } else {
                        File sheetFile = new File(styleFileName);
                        if (!sheetFile.exists()) {
                            quit("Stylesheet file " + sheetFile + " does not exist", 2);
                        }
                        if (styleParserName == null) {
                            styleSource = new StreamSource(sheetFile.toURI().toString());
                        } else {
                            InputSource eis = new InputSource(sheetFile.toURI().toString());
                            styleParser = config.getStyleParser();
                            styleSource = new SAXSource(styleParser, eis);
                        }
                    }

                    if (styleSource == null) {
                        quit("URIResolver for stylesheet file must return a Source", 2);
                    }

                    sheet = (PreparedStylesheet)factory.newTemplates(styleSource);
                    if (styleParser != null) {
                        config.reuseStyleParser(styleParser);
                        // pointless, because the Configuration won't be used again; but we want to set a good example
                    }
                    if (showTime) {
                        long endTime = now();
                        System.err.println("Stylesheet compilation time: " + (endTime - startTime) + " milliseconds");
                    }

                    if (explain) {
                        OutputStream explainOutput;
                        if (explainOutputFileName == null) {
                            explainOutput = System.err;
                        } else {
                            explainOutput = new FileOutputStream(new File(explainOutputFileName));
                        }
                        Properties props = new Properties();
                        props.setProperty(OutputKeys.METHOD, "xml");
                        props.setProperty(OutputKeys.INDENT, "yes");
                        props.setProperty(SaxonOutputKeys.INDENT_SPACES, "2");
                        Receiver diag = config.getSerializerFactory().getReceiver(
                                new StreamResult(explainOutput),
                                config.makePipelineConfiguration(),
                                props);
                        ExpressionPresenter expressionPresenter = new ExpressionPresenter(config, diag);
                        sheet.explain(expressionPresenter);
                        expressionPresenter.close();
                    }

                }

                if (wholeDirectory) {
                    processDirectory(sources, sheet, outputFile,
                            parameterList, initialTemplate, initialMode, traceDestination);
                } else {
                    Source source = (sources == null ? null : (Source)sources.get(0));
                    processFile(source, sheet, outputFile,
                            parameterList, initialTemplate, initialMode, traceDestination);
                }
                if (closeTraceDestination) {
                    traceDestination.close();
                }
            }
        } catch (TerminationException err) {
            quit(err.getMessage(), 1);
        } catch (TransformerConfigurationException err) {
            //err.printStackTrace();
            quit(err.getMessage(), 2);
        } catch (TransformerException err) {
            //err.printStackTrace();
            quit("Transformation failed: " + err.getMessage(), 2);
        } catch (TransformerFactoryConfigurationError err) {
            //err.printStackTrace();
            quit("Transformation failed: " + err.getMessage(), 2);
        } catch (Exception err2) {
            err2.printStackTrace();
            quit("Fatal error during transformation: " + err2.getClass().getName() + ": " +
                    (err2.getMessage() == null ? " (no message)" : err2.getMessage()), 2);
        }


        //System.exit(0);
    }

    /**
     * Preprocess the list of sources. This method exists so that it can be
     * overridden in a subclass
     * @param sources the list of Source objects
     * @return a revised list of Source objects
     */

    public List preprocess(List sources) throws XPathException {
        return sources;
    }

    /**
     * Get the configuration.
     * @return the Saxon configuration
     */

    protected Configuration getConfiguration() {
        return config;
    }

    /**
     * Exit with a message
     *
     * @param message The message to be output
     * @param code    The result code to be returned to the operating
     *                system shell
     */

    protected static void quit(String message, int code) {
        System.err.println(message);
        System.exit(code);
    }

    /**
     * Load a document, or all the documents in a directory, given a filename or URL
     * @param sourceFileName the name of the source file or directory
     * @param useURLs true if the filename argument is to be treated as a URI
     * @param config the Saxon configuration
     * @param useSAXSource true if the method should use a SAXSource rather than a StreamSource
     * @return if sourceFileName represents a single source document, return a Source object representing
     *         that document. If sourceFileName represents a directory, return a List containing multiple Source
     *         objects, one for each file in the directory.
     */

    public static Object loadDocuments(String sourceFileName, boolean useURLs,
                                       Configuration config, boolean useSAXSource)
            throws TransformerException {

        Source sourceInput;
        XMLReader parser;
        if (useURLs || sourceFileName.startsWith("http:") || sourceFileName.startsWith("file:")) {
            sourceInput = config.getURIResolver().resolve(sourceFileName, null);
            if (sourceInput == null) {
                sourceInput = config.getSystemURIResolver().resolve(sourceFileName, null);
            }
            return sourceInput;
        } else if (sourceFileName.equals("-")) {
            // take input from stdin
            if (useSAXSource) {
                parser = config.getSourceParser();
                sourceInput = new SAXSource(parser, new InputSource(System.in));
            } else {
                sourceInput = new StreamSource(System.in);
            }
            return sourceInput;
        } else {
            File sourceFile = new File(sourceFileName);
            if (!sourceFile.exists()) {
                quit("Source file " + sourceFile + " does not exist", 2);
            }
            if (sourceFile.isDirectory()) {
                parser = config.getSourceParser();
                List result = new ArrayList(20);
                String[] files = sourceFile.list();
                for (int f = 0; f < files.length; f++) {
                    File file = new File(sourceFile, files[f]);
                    if (!file.isDirectory()) {
                        if (useSAXSource) {
                            InputSource eis = new InputSource(file.toURI().toString());
                            sourceInput = new SAXSource(parser, eis);
                                // it's safe to use the same parser for each document, as they
                                // will be processed one at a time.
                        } else {
                            sourceInput = new StreamSource(file.toURI().toString());
                        }
                        result.add(sourceInput);
                    }
                }
                return result;
            } else {
                if (useSAXSource) {
                    InputSource eis = new InputSource(sourceFile.toURI().toString());
                    sourceInput = new SAXSource(config.getSourceParser(), eis);
                } else {
                    sourceInput = new StreamSource(sourceFile.toURI().toString());
                }
                return sourceInput;
            }
        }
    }

    /**
     * Process each file in the source directory using its own associated stylesheet
     *
     * @param sources       The sources in the directory to be processed
     * @param outputDir     The directory in which output files are to be
     *                      created
     * @param parameterList List of parameters to be supplied to each
     *                      transformation
     * @param initialMode   Initial mode for executing each
     *                      transformation
     * @param traceDestination output destination for fn:trace() calls
     * @throws Exception when any error occurs during a transformation
     */

    public void processDirectoryAssoc(List sources, File outputDir,
                                      ArrayList parameterList, String initialMode, PrintStream traceDestination)
            throws Exception {

        int failures = 0;
        for (int f = 0; f < sources.size(); f++) {
            Source source = (Source)sources.get(f);
            String localName = getLocalFileName(source);
            try {
                processFileAssoc(source, localName, outputDir, parameterList, initialMode, traceDestination);
            } catch (XPathException err) {
                failures++;
                System.err.println("While processing " + localName +
                        ": " + err.getMessage() + '\n');
            }
        }
        if (failures > 0) {
            throw new XPathException(failures + " transformation" +
                    (failures == 1 ? "" : "s") + " failed");
        }
    }

    /**
     * Make an output file in the output directory, with filename extension derived from the
     * media-type produced by the stylesheet
     *
     * @param directory The directory in which the file is to be created
     * @param localName The local name of the file within the
     *                  directory, excluding the file type suffix
     * @param sheet     The Templates object identifying the stylesheet -
     *                  used to determine the output method, and hence the suffix to be
     *                  used for the filename
     * @return The newly created file
     */

    private File makeOutputFile(File directory, String localName, Templates sheet) {
        String mediaType = sheet.getOutputProperties().getProperty(OutputKeys.MEDIA_TYPE);
        String suffix = ".xml";
        if ("text/html".equals(mediaType)) {
            suffix = ".html";
        } else if ("text/plain".equals(mediaType)) {
            suffix = ".txt";
        }
        String prefix = localName;
        if (localName.endsWith(".xml") || localName.endsWith(".XML")) {
            prefix = localName.substring(0, localName.length() - 4);
        }
        return new File(directory, prefix + suffix);
    }


    /**
     * Process a single source file using its associated stylesheet(s)
     *
     * @param sourceInput   Identifies the source file to be transformed
     * @param localName     The local name of the file within the
     *                      directory, excluding the file type suffix
     * @param outputFile    The output file to contain the results of the
     *                      transformation
     * @param parameterList List of parameters to be supplied to the
     *                      transformation
     * @param initialMode   Initial mode for executing the transformation
     * @param traceDestination Destination for trace output
     * @throws XPathException If the transformation fails
     */

    public void processFileAssoc(Source sourceInput, String localName, File outputFile,
                                 ArrayList parameterList, String initialMode, PrintStream traceDestination)
            throws TransformerException {
        if (showTime) {
            System.err.println("Processing " + sourceInput.getSystemId() + " using associated stylesheet");
        }
        long startTime = now();

        Source style = factory.getAssociatedStylesheet(sourceInput, null, null, null);
        Templates sheet = factory.newTemplates(style);
        if (showTime) {
            System.err.println("Prepared associated stylesheet " + style.getSystemId());
        }

        Controller controller =
                newController(sheet, parameterList, traceDestination, initialMode, null);

        File outFile = outputFile;

        if (outFile != null && outFile.isDirectory()) {
            outFile = makeOutputFile(outFile, localName, sheet);
        }

        StreamResult result =
                (outFile == null ? new StreamResult(System.out) : new StreamResult(outFile.toURI().toString()));

        try {
            controller.transform(sourceInput, result);
        } catch (TerminationException err) {
            throw err;
        } catch (XPathException err) {
            // The error message will already have been displayed; don't do it twice
            throw new XPathException("Run-time errors were reported");
        }

        if (showTime) {
            long endTime = now();
            System.err.println("Execution time: " + (endTime - startTime) + " milliseconds");
        }
    }

    /**
     * Create a new Controller. This method is protected so it can be overridden in a subclass, allowing additional
     * options to be set on the Controller
     * @param sheet The Templates object representing the compiled stylesheet
     * @param parameterList A list of "keyword=value" pairs representing parameter values, in their original
     * format from the command line, including any initial "+" or "!" qualifier
     * @param traceDestination destination for trace output
     * @param initialMode the initial mode for the transformation, as a Clark name. Can be null
     * @param initialTemplate the name of the initial template for the transformation, as a Clark name. Can be null
     * @return the newly constructed Controller to be used for the transformation
     * @throws TransformerException if any error occurs
     */

    protected Controller newController(
            Templates sheet, ArrayList parameterList, PrintStream traceDestination,
            String initialMode, String initialTemplate) throws TransformerException {
        Controller controller = (Controller)sheet.newTransformer();
        setParams(controller, parameterList);
        controller.setTraceFunctionDestination(traceDestination);
        if (initialMode != null) {
            controller.setInitialMode(initialMode);
        }
        if (initialTemplate != null) {
            controller.setInitialTemplate(initialTemplate);
        }
        return controller;
    }

    /**
     * Get current time in milliseconds
     * @return the current time in milliseconds since 1970
     */

    public static long now() {
        return System.currentTimeMillis();
    }

    /**
     * Process each file in the source directory using the same supplied stylesheet
     *
     * @param sources       The sources in the directory to be processed
     * @param sheet         The Templates object identifying the stylesheet
     * @param outputDir     The directory in which output files are to be
     *                      created
     * @param parameterList List of parameters to be supplied to each
     *                      transformation
     * @param initialTemplate Initial template for executing each
     *                      transformation
     * @param initialMode   Initial mode for executing each
     *                      transformation
     * @param traceDestination Destination for output from fn:trace() calls
     * @throws XPathException when any error occurs during a
     *                        transformation
     */

    public void processDirectory(List sources, Templates sheet, File outputDir, ArrayList parameterList,
                                 String initialTemplate, String initialMode, PrintStream traceDestination)
            throws TransformerException {
        int failures = 0;
        for (int f = 0; f < sources.size(); f++) {
            Source source = (Source)sources.get(f);
            String localName = getLocalFileName(source);
            try {
                File outputFile = makeOutputFile(outputDir, localName, sheet);
                processFile(source, sheet, outputFile, parameterList, initialTemplate, initialMode, traceDestination);
            } catch (XPathException err) {
                failures++;
                System.err.println("While processing " + localName + ": " + err.getMessage() + '\n');
            }
        }
        if (failures > 0) {
            throw new XPathException(failures + " transformation" +
                    (failures == 1 ? "" : "s") + " failed");
        }
    }

    private static String getLocalFileName(Source source) {
        try {
            String path = new URI(source.getSystemId()).getPath();
            while (true) {
                int sep = path.indexOf('/');
                if (sep < 0) {
                    return path;
                } else {
                    path = path.substring(sep + 1);
                }
            }
        } catch (URISyntaxException err) {
            throw new IllegalArgumentException(err.getMessage());
        }
    }

    /**
     * Process a single file using a supplied stylesheet
     *
     * @param source        The source XML document to be transformed (maybe null if an initial template
     *                      is specified)
     * @param sheet         The Templates object identifying the stylesheet
     * @param outputFile    The output file to contain the results of the
     *                      transformation
     * @param parameterList List of parameters to be supplied to the
     *                      transformation
     * @param initialTemplate Initial template for executing each
     *                      transformation
     * @param initialMode   Initial mode for executing the transformation
     * @param traceDestination Destination for output from fn:trace() function
     * @throws org.pdf4j.saxon.trans.XPathException
     *          If the transformation fails
     */

    public void processFile(Source source, Templates sheet, File outputFile, ArrayList parameterList,
                            String initialTemplate, String initialMode, PrintStream traceDestination)
            throws TransformerException {

        long totalTime = 0;
        int runs = 0;
        for (int r = 0; r < repeat; r++) {      // repeat is for internal testing/timing
            if (showTime) {
                String msg = "Processing ";
                if (source != null) {
                    msg += source.getSystemId();
                } else {
                    msg += " (no source document)";
                }
                if (initialMode != null) {
                    msg += " initial mode = " + initialMode;
                }
                if (initialTemplate != null) {
                    msg += " initial template = " + initialTemplate;
                }
                System.err.println(msg);
            }
            long startTime = now();
            runs++;
            Controller controller =
                    newController(sheet, parameterList, traceDestination, initialMode, initialTemplate);

            Result result =
                    (outputFile == null ?
                    new StreamResult(System.out) :
                    new StreamResult(outputFile.toURI().toString()));

            try {
                controller.transform(source, result);
            } catch (TerminationException err) {
                throw err;
            } catch (XPathException err) {
                // The message will already have been displayed; don't do it twice
                if (!err.hasBeenReported()) {
                    err.printStackTrace();
                }
                throw new XPathException("Run-time errors were reported");
            }

            long endTime = now();
            totalTime += (endTime - startTime);
            if (showTime) {
                System.err.println("Execution time: " + (endTime - startTime) + " milliseconds");
                System.err.println("Memory used: " + (Runtime.getRuntime().totalMemory() - Runtime.getRuntime().freeMemory()));
                config.getNamePool().statistics();
                if (repeat > 1) {
                    System.err.println("-------------------------------");
                    Runtime.getRuntime().gc();
                }
            }
            if (repeat == 999999 && totalTime > 60000) {
                break;
            }
        }
        if (repeat > 1) {
            System.err.println("*** Average execution time over " + runs + " runs: " + (totalTime / runs) + "ms");
        }
    }

    /**
     * Supply the requested parameters to the transformer. This method is protected so that it can
     * be overridden in a subclass.
     *
     * @param controller  The controller to be used for the transformation
     * @param parameterList A list of "keyword=value" pairs representing parameter values, in their original
     * format from the command line, including any initial "+" or "!" qualifier
     */
    protected void setParams(Controller controller, ArrayList parameterList)
            throws TransformerException {
        for (int i = 0; i < parameterList.size(); i++) {
            String arg = (String)parameterList.get(i);
            int eq = arg.indexOf("=");
            String argname = arg.substring(0, eq);
            String argvalue = (eq == arg.length()-1 ? "" : arg.substring(eq + 1));
            if (argname.startsWith("!")) {
                // parameters starting with "!" are taken as output properties
                controller.setOutputProperty(argname.substring(1), argvalue);
            } else if (argname.startsWith("+")) {
                // parameters starting with "+" are taken as input documents
                Object sources = loadDocuments(argvalue, useURLs, config, true);
                controller.setParameter(argname.substring(1), sources);
            } else {
                controller.setParameter(argname, new UntypedAtomicValue(argvalue));
            }
        }
    }

    /**
     * Report incorrect usage of the command line, with a list of the options and arguments that are available
     *
     * @param name    The name of the command being executed (allows subclassing)
     * @param message The error message
     */
    protected void badUsage(String name, String message) {
        if (!"".equals(message)) {
            System.err.println(message);
        }
        if (!showTime) {
            System.err.println(config.getProductTitle());
        }
        System.err.println("Usage: see http://www.saxonica.com/documentation/using-xsl/commandline.html");
        System.err.println("Options: ");
        System.err.println("  -a                    Use xml-stylesheet PI, not style-doc argument");
        System.err.println("  -c:filename           Use compiled stylesheet from file");
        System.err.println("  -cr:classname         Use collection URI resolver class");
        System.err.println("  -dtd:on|off           Validate using DTD");
        System.err.println("  -expand:on|off        Expand defaults defined in schema/DTD");
        System.err.println("  -explain[:filename]   Display compiled expression tree");
        System.err.println("  -ext:on|off           Allow|Disallow external Java functions");
        System.err.println("  -im:modename          Initial mode");
        System.err.println("  -it:template          Initial template");
        System.err.println("  -l:on|off             Line numbering for source document");
        System.err.println("  -m:classname          Use message receiver class");
        System.err.println("  -o:filename           Output file or directory");
        System.err.println("  -or:classname         Use OutputURIResolver class");
        System.err.println("  -outval:recover|fatal Handling of validation errors on result document");
        System.err.println("  -p:on|off             Recognize URI query parameters");
        System.err.println("  -r:classname          Use URIResolver class");
        System.err.println("  -repeat:N             Repeat N times for performance measurement");
        System.err.println("  -s:filename           Initial source document");
        System.err.println("  -sa                   Schema-aware transformation");
        System.err.println("  -strip:all|none|ignorable      Strip whitespace text nodes");
        System.err.println("  -t                    Display version and timing information");
        System.err.println("  -T[:classname]        Use TraceListener class");
        System.err.println("  -TJ                   Trace calls to external Java functions");
        System.err.println("  -tree:tiny|linked     Select tree model");
        System.err.println("  -traceout:file|#null  Destination for fn:trace() output");
        System.err.println("  -u                    Names are URLs not filenames");
        System.err.println("  -val:strict|lax       Validate using schema");
        System.err.println("  -versionmsg:on|off    Warn when using XSLT 1.0 stylesheet");
        System.err.println("  -warnings:silent|recover|fatal  Handling of recoverable errors");
        System.err.println("  -x:classname          Use specified SAX parser for source file");
        System.err.println("  -xi:on|off            Expand XInclude on all documents");
        System.err.println("  -xmlversion:1.0|1.1   Version of XML to be handled");
        System.err.println("  -xsd:file;file..      Additional schema documents to be loaded");
        System.err.println("  -xsdversion:1.0|1.1   Version of XML Schema to be used");
        System.err.println("  -xsiloc:on|off        Take note of xsi:schemaLocation");
        System.err.println("  -xsl:filename         Stylesheet file");
        System.err.println("  -y:classname          Use specified SAX parser for stylesheet");
        System.err.println("  -?                    Display this message ");
        System.err.println("  param=value           Set stylesheet string parameter");
        System.err.println("  +param=filename       Set stylesheet document parameter");
        System.err.println("  !option=value         Set serialization option");
        if ("".equals(message)) {
            System.exit(0);
        } else {
            System.exit(2);
        }
    }

}

//
// The contents of this file are subject to the Mozilla Public License Version 1.0 (the "License");
// you may not use this file except in compliance with the License. You may obtain a copy of the
// License at http://www.mozilla.org/MPL/
//
// Software distributed under the License is distributed on an "AS IS" basis,
// WITHOUT WARRANTY OF ANY KIND, either express or implied.
// See the License for the specific language governing rights and limitations under the License.
//
// The Original Code is: all this file.
//
// The Initial Developer of the Original Code is Michael H. Kay.
//
// Portions created by (your name) are Copyright (C) (your legal entity). All Rights Reserved.
//
// Contributor(s): changes to allow source and/or stylesheet from stdin contributed by
// Gunther Schadow [gunther@aurora.regenstrief.org]
//
TOP

Related Classes of org.pdf4j.saxon.Transform

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.