/* Copyright 2002-2005 Elliotte Rusty Harold
This library is free software; you can redistribute it and/or modify
it under the terms of version 2.1 of the GNU Lesser General Public
License as published by the Free Software Foundation.
This library is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU Lesser General Public License for more details.
You should have received a copy of the GNU Lesser General Public
License along with this library; if not, write to the
Free Software Foundation, Inc., 59 Temple Place, Suite 330,
Boston, MA 02111-1307 USA
You can contact Elliotte Rusty Harold by sending e-mail to
elharo@metalab.unc.edu. Please include the word "XOM" in the
subject line. The XOM home page is located at http://www.xom.nu/
*/
package nu.xom.converters;
import nu.xom.Attribute;
import nu.xom.Comment;
import nu.xom.DocType;
import nu.xom.Document;
import nu.xom.Element;
import nu.xom.Node;
import nu.xom.Nodes;
import nu.xom.ParentNode;
import nu.xom.ProcessingInstruction;
import nu.xom.Text;
import org.xml.sax.ContentHandler;
import org.xml.sax.SAXException;
import org.xml.sax.ext.LexicalHandler;
import org.xml.sax.helpers.AttributesImpl;
import org.xml.sax.helpers.LocatorImpl;
/**
* <p>
* Feeds a XOM <code>Document</code> into a
* SAX2 <code>ContentHandler</code>.
* </p>
*
* @author Elliotte Rusty Harold
* @version 1.1b2
*/
public class SAXConverter {
private ContentHandler contentHandler;
private LexicalHandler lexicalHandler;
private LocatorImpl locator;
private boolean stripBaseAttributes = true;
/**
* <p>
* Creates a new <code>SAXConverter</code>.
* </p>
*
* @param handler the SAX2 content handler
* that receives the data
*
* @throws NullPointerException if handler is null
*
*/
public SAXConverter(ContentHandler handler) {
setContentHandler(handler);
}
/**
* <p>
* Set the content handler for this converter.
* </p>
*
* @param handler SAX2 content handler that
* receives the data
*
* @throws NullPointerException if handler is null
*
*/
public void setContentHandler(ContentHandler handler) {
if (handler == null) {
throw new NullPointerException(
"ContentHandler must be non-null."
);
}
// unbelievably skanky hack to allow xml:base attributes
// to be passed to XSL transforms without mucking with the
// public API. This would be so much easier if Java had friend
// functions.
else if ("nu.xom.xslt.XSLTHandler".equals(handler.getClass().getName())) {
this.stripBaseAttributes = false;
}
else {
this.contentHandler = handler;
}
}
/**
* <p>
* Returns the content handler.
* </p>
*
* @return SAX2 content handler that receives the data
*/
public ContentHandler getContentHandler() {
return this.contentHandler;
}
/**
* <p>
* Sets the optional lexical handler for this converter.
* The only lexical events the converter supplies
* are comments.
* </p>
*
* @param handler the lexical handler;
* may be null to turn off lexical events
*/
public void setLexicalHandler(LexicalHandler handler) {
this.lexicalHandler = handler;
}
/**
* <p>
* Returns the <code>LexicalHandler</code> for this
* converter. This is only used for comments.
* </p>
*
* @return SAX2 lexical handler that receives
* lexical events
*/
public LexicalHandler getLexicalHandler() {
return this.lexicalHandler;
}
// Not necessary to worry about parser exceptions passed to
// fatalError() because we're starting with a known good document.
// Only exceptions that can arise are thrown by
// the supplied ContentHandler, and we don't want to pass those
// to the ErrorHandler, or call endDocument() if such an exception
// is thrown
/**
* <p>
* Feed a document through this converter.
* </p>
*
* @param doc the document to pass to SAX
*
* @throws SAXException if the content handler
* or lexical handler throws an exception
*/
public void convert(Document doc) throws SAXException {
locator = new LocatorImpl();
locator.setSystemId(doc.getBaseURI());
contentHandler.setDocumentLocator(locator);
contentHandler.startDocument();
for (int i = 0; i < doc.getChildCount(); i++) {
process(doc.getChild(i));
}
contentHandler.endDocument();
}
private void process(Node node) throws SAXException {
if (node instanceof Element) {
convertElement((Element) node);
}
else if (node instanceof Text) {
String data = node.getValue();
contentHandler.characters(
data.toCharArray(), 0, data.length());
}
else if (node instanceof ProcessingInstruction) {
ProcessingInstruction instruction
= (ProcessingInstruction) node;
contentHandler.processingInstruction(
instruction.getTarget(), instruction.getValue());
}
else if (node instanceof Comment && lexicalHandler != null) {
String data = node.getValue();
lexicalHandler.comment(
data.toCharArray(), 0, data.length());
}
else if (node instanceof DocType && lexicalHandler != null) {
DocType type = (DocType) node;
lexicalHandler.startDTD(type.getRootElementName(),
type.getPublicID(), type.getSystemID());
lexicalHandler.endDTD();
}
// all other types are ignored
}
/**
* @param element the context in which the prefix is mapped
* @param prefix the prefix to pass to statPrefixMapping
* @return true if and only if startPrefixMapping was called
* @throws SAXException if the ContentHandler throws an exception
*/
private boolean convertNamespace(Element element, String prefix)
throws SAXException {
// XXX could store a stack of these in a namespaceSupport to avoid going up to the parent
String uri = element.getNamespaceURI(prefix);
ParentNode parentNode = element.getParent();
Element parent = null;
if (parentNode instanceof Element) {
parent = (Element) parentNode;
}
if (parent != null && uri.equals(parent.getNamespaceURI(prefix))) {
return false;
}
else if (parent == null && "".equals(uri)) {
// Do not fire startPrefixMapping event for no namespace
// on root element
return false;
}
contentHandler.startPrefixMapping(prefix, uri);
return true; // i.e. converted
}
private void convertElement(Element element) throws SAXException {
locator.setSystemId(element.getBaseURI());
// start prefix mapping
int namespaceCount = element.getNamespaceDeclarationCount();
String[] prefixes = new String[namespaceCount];
int prefixCount = 0;
for (int i = 0; i < namespaceCount; i++) {
String prefix = element.getNamespacePrefix(i);
boolean converted = convertNamespace(element, prefix);
if (converted) {
prefixes[prefixCount] = prefix;
prefixCount++;
}
}
// prepare attributes
AttributesImpl saxAttributes = new AttributesImpl();
int attributeCount = element.getAttributeCount();
for (int i = 0; i < attributeCount; i++) {
Attribute attribute = element.getAttribute(i);
// The base URIs provided by the locator have already
// accounted for any xml:base attributes. We do not
// also pass in xml:base attributes or some relative base
// URIs could be applied twice.
if ("base".equals(attribute.getLocalName())
&& "http://www.w3.org/XML/1998/namespace".equals(attribute.getNamespaceURI())
&& stripBaseAttributes) {
continue;
}
saxAttributes.addAttribute(attribute.getNamespaceURI(),
attribute.getLocalName(),
attribute.getQualifiedName(),
getSAXType(attribute),
attribute.getValue());
}
contentHandler.startElement(
element.getNamespaceURI(),
element.getLocalName(),
element.getQualifiedName(),
saxAttributes);
int childCount = element.getChildCount();
for (int i = 0; i < childCount; i++) {
process(element.getChild(i));
}
contentHandler.endElement(element.getNamespaceURI(),
element.getLocalName(), element.getQualifiedName());
// end prefix mappings
for (int i = 0; i < prefixCount; i++) {
contentHandler.endPrefixMapping(prefixes[i]);
}
}
private static String getSAXType(Attribute attribute) {
Attribute.Type type = attribute.getType();
if (type.equals(Attribute.Type.UNDECLARED)) return "CDATA";
if (type.equals(Attribute.Type.CDATA)) return "CDATA";
if (type.equals(Attribute.Type.ID)) return "ID";
if (type.equals(Attribute.Type.IDREF)) return "IDREF";
if (type.equals(Attribute.Type.IDREFS)) return "IDREFS";
if (type.equals(Attribute.Type.NMTOKEN)) return "NMTOKEN";
if (type.equals(Attribute.Type.NMTOKENS)) return "NMTOKENS";
if (type.equals(Attribute.Type.ENTITY)) return "ENTITY";
if (type.equals(Attribute.Type.ENTITIES)) return "ENTITIES";
if (type.equals(Attribute.Type.NOTATION)) return "NOTATION";
return "NMTOKEN"; // ENUMERATED
}
/**
* <p>
* Converts a <code>Nodes</code> list into SAX by firing events
* into the registered handlers. This method calls
* <code>startDocument</code> before processing the list
* of nodes, and calls <code>endDocument</code> after processing
* all of them.
* </p>
*
* @param nodes the nodes to pass to SAX
*
* @throws SAXException if the content handler
* or lexical handler throws an exception
*/
public void convert(Nodes nodes) throws SAXException {
if (nodes.size() == 1 && nodes.get(0) instanceof Document) {
convert((Document) nodes.get(0));
}
else {
locator = new LocatorImpl();
contentHandler.setDocumentLocator(locator);
contentHandler.startDocument();
for (int i = 0; i < nodes.size(); i++) {
process(nodes.get(i));
}
contentHandler.endDocument();
}
}
}