/* Copyright 2002-2005 Elliotte Rusty Harold
   
   This library is free software; you can redistribute it and/or modify
   it under the terms of version 2.1 of the GNU Lesser General Public 
   License as published by the Free Software Foundation.
   
   This library is distributed in the hope that it will be useful,
   but WITHOUT ANY WARRANTY; without even the implied warranty of
   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
   GNU Lesser General Public License for more details.
   
   You should have received a copy of the GNU Lesser General Public
   License along with this library; if not, write to the 
   Free Software Foundation, Inc., 59 Temple Place, Suite 330, 
   Boston, MA 02111-1307  USA
   
   You can contact Elliotte Rusty Harold by sending e-mail to
   elharo@ibiblio.org. Please include the word "XOM" in the
   subject line. The XOM home page is located at http://www.xom.nu/
*/

package nu.xom.converters;

import nu.xom.Attribute;
import nu.xom.Comment;
import nu.xom.DocType;
import nu.xom.Document;
import nu.xom.Element;
import nu.xom.Node;
import nu.xom.Nodes;
import nu.xom.ParentNode;
import nu.xom.ProcessingInstruction;
import nu.xom.Text;

import org.xml.sax.ContentHandler;
import org.xml.sax.SAXException;
import org.xml.sax.ext.LexicalHandler;
import org.xml.sax.helpers.AttributesImpl;
import org.xml.sax.helpers.LocatorImpl;

Feeds a XOM Document into a SAX2 ContentHandler.

Author:Elliotte Rusty Harold
Version:1.1b2
/** * <p> * Feeds a XOM <code>Document</code> into a * SAX2 <code>ContentHandler</code>. * </p> * * @author Elliotte Rusty Harold * @version 1.1b2 */
public class SAXConverter { private ContentHandler contentHandler; private LexicalHandler lexicalHandler; private LocatorImpl locator; private boolean stripBaseAttributes = true;

Creates a new SAXConverter.

Params:
  • handler – the SAX2 content handler that receives the data
Throws:
/** * <p> * Creates a new <code>SAXConverter</code>. * </p> * * @param handler the SAX2 content handler * that receives the data * * @throws NullPointerException if handler is null * */
public SAXConverter(ContentHandler handler) { setContentHandler(handler); }

Set the content handler for this converter.

Params:
  • handler – SAX2 content handler that receives the data
Throws:
/** * <p> * Set the content handler for this converter. * </p> * * @param handler SAX2 content handler that * receives the data * * @throws NullPointerException if handler is null * */
public void setContentHandler(ContentHandler handler) { if (handler == null) { throw new NullPointerException( "ContentHandler must be non-null." ); } // unbelievably skanky hack to allow xml:base attributes // to be passed to XSL transforms without mucking with the // public API. This would be so much easier if Java had friend // functions. else if ("nu.xom.xslt.XSLTHandler".equals(handler.getClass().getName())) { this.stripBaseAttributes = false; } else { this.contentHandler = handler; } }

Returns the content handler.

Returns:SAX2 content handler that receives the data
/** * <p> * Returns the content handler. * </p> * * @return SAX2 content handler that receives the data */
public ContentHandler getContentHandler() { return this.contentHandler; }

Sets the optional lexical handler for this converter. The only lexical events the converter supplies are comments.

Params:
  • handler – the lexical handler; may be null to turn off lexical events
/** * <p> * Sets the optional lexical handler for this converter. * The only lexical events the converter supplies * are comments. * </p> * * @param handler the lexical handler; * may be null to turn off lexical events */
public void setLexicalHandler(LexicalHandler handler) { this.lexicalHandler = handler; }

Returns the LexicalHandler for this converter. This is only used for comments.

Returns:SAX2 lexical handler that receives lexical events
/** * <p> * Returns the <code>LexicalHandler</code> for this * converter. This is only used for comments. * </p> * * @return SAX2 lexical handler that receives * lexical events */
public LexicalHandler getLexicalHandler() { return this.lexicalHandler; } // Not necessary to worry about parser exceptions passed to // fatalError() because we're starting with a known good document. // Only exceptions that can arise are thrown by // the supplied ContentHandler, and we don't want to pass those // to the ErrorHandler, or call endDocument() if such an exception // is thrown

Feed a document through this converter.

Params:
  • doc – the document to pass to SAX
Throws:
  • SAXException – if the content handler or lexical handler throws an exception
/** * <p> * Feed a document through this converter. * </p> * * @param doc the document to pass to SAX * * @throws SAXException if the content handler * or lexical handler throws an exception */
public void convert(Document doc) throws SAXException { locator = new LocatorImpl(); locator.setSystemId(doc.getBaseURI()); contentHandler.setDocumentLocator(locator); contentHandler.startDocument(); for (int i = 0; i < doc.getChildCount(); i++) { process(doc.getChild(i)); } contentHandler.endDocument(); } private void process(Node node) throws SAXException { if (node instanceof Element) { convertElement((Element) node); } else if (node instanceof Text) { String data = node.getValue(); contentHandler.characters( data.toCharArray(), 0, data.length()); } else if (node instanceof ProcessingInstruction) { ProcessingInstruction instruction = (ProcessingInstruction) node; contentHandler.processingInstruction( instruction.getTarget(), instruction.getValue()); } else if (node instanceof Comment && lexicalHandler != null) { String data = node.getValue(); lexicalHandler.comment( data.toCharArray(), 0, data.length()); } else if (node instanceof DocType && lexicalHandler != null) { DocType type = (DocType) node; lexicalHandler.startDTD(type.getRootElementName(), type.getPublicID(), type.getSystemID()); lexicalHandler.endDTD(); } // all other types are ignored }
Params:
  • element – the context in which the prefix is mapped
  • prefix – the prefix to pass to statPrefixMapping
Throws:
Returns:true if and only if startPrefixMapping was called
/** * @param element the context in which the prefix is mapped * @param prefix the prefix to pass to statPrefixMapping * @return true if and only if startPrefixMapping was called * @throws SAXException if the ContentHandler throws an exception */
private boolean convertNamespace(Element element, String prefix) throws SAXException { // XXX could store a stack of these in a namespaceSupport to avoid going up to the parent String uri = element.getNamespaceURI(prefix); ParentNode parentNode = element.getParent(); Element parent = null; if (parentNode instanceof Element) { parent = (Element) parentNode; } if (parent != null && uri.equals(parent.getNamespaceURI(prefix))) { return false; } else if (parent == null && "".equals(uri)) { // Do not fire startPrefixMapping event for no namespace // on root element return false; } contentHandler.startPrefixMapping(prefix, uri); return true; // i.e. converted } private void convertElement(Element element) throws SAXException { locator.setSystemId(element.getBaseURI()); // start prefix mapping int namespaceCount = element.getNamespaceDeclarationCount(); String[] prefixes = new String[namespaceCount]; int prefixCount = 0; for (int i = 0; i < namespaceCount; i++) { String prefix = element.getNamespacePrefix(i); boolean converted = convertNamespace(element, prefix); if (converted) { prefixes[prefixCount] = prefix; prefixCount++; } } // prepare attributes AttributesImpl saxAttributes = new AttributesImpl(); int attributeCount = element.getAttributeCount(); for (int i = 0; i < attributeCount; i++) { Attribute attribute = element.getAttribute(i); // The base URIs provided by the locator have already // accounted for any xml:base attributes. We do not // also pass in xml:base attributes or some relative base // URIs could be applied twice. if ("base".equals(attribute.getLocalName()) && "http://www.w3.org/XML/1998/namespace".equals(attribute.getNamespaceURI()) && stripBaseAttributes) { continue; } saxAttributes.addAttribute(attribute.getNamespaceURI(), attribute.getLocalName(), attribute.getQualifiedName(), getSAXType(attribute), attribute.getValue()); } contentHandler.startElement( element.getNamespaceURI(), element.getLocalName(), element.getQualifiedName(), saxAttributes); int childCount = element.getChildCount(); for (int i = 0; i < childCount; i++) { process(element.getChild(i)); } contentHandler.endElement(element.getNamespaceURI(), element.getLocalName(), element.getQualifiedName()); // end prefix mappings for (int i = 0; i < prefixCount; i++) { contentHandler.endPrefixMapping(prefixes[i]); } } private static String getSAXType(Attribute attribute) { Attribute.Type type = attribute.getType(); if (type.equals(Attribute.Type.UNDECLARED)) return "CDATA"; if (type.equals(Attribute.Type.CDATA)) return "CDATA"; if (type.equals(Attribute.Type.ID)) return "ID"; if (type.equals(Attribute.Type.IDREF)) return "IDREF"; if (type.equals(Attribute.Type.IDREFS)) return "IDREFS"; if (type.equals(Attribute.Type.NMTOKEN)) return "NMTOKEN"; if (type.equals(Attribute.Type.NMTOKENS)) return "NMTOKENS"; if (type.equals(Attribute.Type.ENTITY)) return "ENTITY"; if (type.equals(Attribute.Type.ENTITIES)) return "ENTITIES"; if (type.equals(Attribute.Type.NOTATION)) return "NOTATION"; return "NMTOKEN"; // ENUMERATED }

Converts a Nodes list into SAX by firing events into the registered handlers. This method calls startDocument before processing the list of nodes, and calls endDocument after processing all of them.

Params:
  • nodes – the nodes to pass to SAX
Throws:
  • SAXException – if the content handler or lexical handler throws an exception
/** * <p> * Converts a <code>Nodes</code> list into SAX by firing events * into the registered handlers. This method calls * <code>startDocument</code> before processing the list * of nodes, and calls <code>endDocument</code> after processing * all of them. * </p> * * @param nodes the nodes to pass to SAX * * @throws SAXException if the content handler * or lexical handler throws an exception */
public void convert(Nodes nodes) throws SAXException { if (nodes.size() == 1 && nodes.get(0) instanceof Document) { convert((Document) nodes.get(0)); } else { locator = new LocatorImpl(); contentHandler.setDocumentLocator(locator); contentHandler.startDocument(); for (int i = 0; i < nodes.size(); i++) { process(nodes.get(i)); } contentHandler.endDocument(); } } }