org.jdom2.input.DOMBuilder.java Source code

Java tutorial

Introduction

Here is the source code for org.jdom2.input.DOMBuilder.java

Source

/*--
    
 Copyright (C) 2000-2012 Jason Hunter & Brett McLaughlin.
 All rights reserved.
    
 Redistribution and use in source and binary forms, with or without
 modification, are permitted provided that the following conditions
 are met:
    
 1. Redistributions of source code must retain the above copyright
notice, this list of conditions, and the following disclaimer.
    
 2. Redistributions in binary form must reproduce the above copyright
notice, this list of conditions, and the disclaimer that follows
these conditions in the documentation and/or other materials
provided with the distribution.
    
 3. The name "JDOM" must not be used to endorse or promote products
derived from this software without prior written permission.  For
written permission, please contact <request_AT_jdom_DOT_org>.
    
 4. Products derived from this software may not be called "JDOM", nor
may "JDOM" appear in their name, without prior written permission
from the JDOM Project Management <request_AT_jdom_DOT_org>.
    
 In addition, we request (but do not require) that you include in the
 end-user documentation provided with the redistribution and/or in the
 software itself an acknowledgement equivalent to the following:
 "This product includes software developed by the
  JDOM Project (http://www.jdom.org/)."
 Alternatively, the acknowledgment may be graphical using the logos
 available at http://www.jdom.org/images/logos.
    
 THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
 WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 DISCLAIMED.  IN NO EVENT SHALL THE JDOM AUTHORS OR THE PROJECT
 CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
 USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
 OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 SUCH DAMAGE.
    
 This software consists of voluntary contributions made by many
 individuals on behalf of the JDOM Project and was originally
 created by Jason Hunter <jhunter_AT_jdom_DOT_org> and
 Brett McLaughlin <brett_AT_jdom_DOT_org>.  For more information
 on the JDOM Project, please see <http://www.jdom.org/>.
    
 */

package org.jdom2.input;

/*
 * To keep things simple, all DOM-based items are fully qualified in this code.
 * As such, there are no import org.w3c.dom.* statements...
 * This way there isless confusion about what a Document or Element is....
 */

import static org.jdom2.JDOMConstants.*;

import java.util.HashMap;

import org.jdom2.Attribute;
import org.jdom2.DefaultJDOMFactory;
import org.jdom2.DocType;
import org.jdom2.Document;
import org.jdom2.Element;
import org.jdom2.JDOMFactory;
import org.jdom2.Namespace;

/**
 * Builds a JDOM Document from a pre-existing DOM {@link org.w3c.dom.Document 
 * org.w3c.dom.Document}.
 * <p>
 * If you are building a document that has Namespace declarations, you should
 * ensure that the Namespaces are correctly recorded in the DOM document before
 * building the JDOM document from the DOM. By default, the native Java
 * DOMBuilderFactory is configured to ignore Namespaces, and thus they are
 * 'lost' in the DOM tree. JDOM expects Namespace-aware documents, so you
 * should ensure that you change the default settings on the
 * DOMBuilderFactory before parsing the DOM document. For example:
 * <p>
 * <pre>
 *     DocumentBuilderFactory domfactory = DocumentBuilderFactory.newInstance();
 *     domfactory.setNamespaceAware(true);
 *     DocumentBuilder dombuilder = domfac.newDocumentBuilder();
 *     org.w3c.dom.Document doc = dombuilder.parse(....);
 * </pre>
 * 
 * @author  Brett McLaughlin
 * @author  Jason Hunter
 * @author  Philip Nelson
 * @author  Kevin Regan
 * @author  Yusuf Goolamabbas
 * @author  Dan Schaffer
 * @author  Bradley S. Huffman
 */
public class DOMBuilder {

    /** The factory for creating new JDOM objects */
    private JDOMFactory factory = new DefaultJDOMFactory();

    /**
     * This creates a new DOMBuilder instance using the DefaultJDOMFactory
     * to build the JDOM content.
     */
    public DOMBuilder() {
    }

    /**
     * This sets a custom JDOMFactory for the builder.  Use this to build
     * the tree with your own subclasses of the JDOM classes.
     *
     * @param factory <code>JDOMFactory</code> to use
     */
    public void setFactory(JDOMFactory factory) {
        this.factory = factory;
    }

    /**
     * Returns the current {@link org.jdom2.JDOMFactory} in use.
     * @return the factory in use
     */
    public JDOMFactory getFactory() {
        return factory;
    }

    /**
     * This will build a JDOM tree from an existing DOM tree.
     *
     * @param domDocument <code>org.w3c.dom.Document</code> object
     * @return <code>Document</code> - JDOM document object.
     */
    public Document build(org.w3c.dom.Document domDocument) {
        Document doc = factory.document(null);
        buildTree(domDocument, doc, null, true);
        return doc;
    }

    /**
     * This will build a JDOM Element from an existing DOM Element
     *
     * @param domElement <code> org.w3c.dom.Element</code> object
     * @return <code>Element</code> - JDOM Element object
     */
    public org.jdom2.Element build(org.w3c.dom.Element domElement) {
        Document doc = factory.document(null);
        buildTree(domElement, doc, null, true);
        return doc.getRootElement();
    }

    /**
     * This will build a JDOM CDATA from an existing DOM CDATASection
     *
     * @param cdata <code> org.w3c.dom.CDATASection</code> object
     * @return <code>CDATA</code> - JDOM CDATA object
     * @since JDOM2
     */
    public org.jdom2.CDATA build(org.w3c.dom.CDATASection cdata) {
        return factory.cdata(cdata.getNodeValue());
    }

    /**
     * This will build a JDOM Text from an existing DOM Text
     *
     * @param text <code> org.w3c.dom.Text</code> object
     * @return <code>Text</code> - JDOM Text object
     * @since JDOM2
     */
    public org.jdom2.Text build(org.w3c.dom.Text text) {
        return factory.text(text.getNodeValue());
    }

    /**
     * This will build a JDOM Comment from an existing DOM Comment
     *
     * @param comment <code> org.w3c.dom.Comment</code> object
     * @return <code>Comment</code> - JDOM Comment object
     * @since JDOM2
     */
    public org.jdom2.Comment build(org.w3c.dom.Comment comment) {
        return factory.comment(comment.getNodeValue());
    }

    /**
     * This will build a JDOM ProcessingInstruction from an existing DOM ProcessingInstruction
     *
     * @param pi <code> org.w3c.dom.ProcessingInstruction</code> object
     * @return <code>ProcessingInstruction</code> - JDOM ProcessingInstruction object
     * @since JDOM2
     */
    public org.jdom2.ProcessingInstruction build(org.w3c.dom.ProcessingInstruction pi) {
        return factory.processingInstruction(pi.getTarget(), pi.getData());
    }

    /**
     * This will build a JDOM EntityRef from an existing DOM EntityReference
     *
     * @param er <code> org.w3c.dom.EntityReference</code> object
     * @return <code>EnityRef</code> - JDOM EntityRef object
     * @since JDOM2
     */
    public org.jdom2.EntityRef build(org.w3c.dom.EntityReference er) {
        return factory.entityRef(er.getNodeName());
    }

    /**
     * This will build a JDOM Element from an existing DOM Element
     *
     * @param doctype <code> org.w3c.dom.Element</code> object
     * @return <code>Element</code> - JDOM Element object
     * @since JDOM2
     */
    public org.jdom2.DocType build(org.w3c.dom.DocumentType doctype) {
        String publicID = doctype.getPublicId();
        String systemID = doctype.getSystemId();
        String internalDTD = doctype.getInternalSubset();

        DocType docType = factory.docType(doctype.getName());
        docType.setPublicID(publicID);
        docType.setSystemID(systemID);
        docType.setInternalSubset(internalDTD);
        return docType;
    }

    /**
     * This takes a DOM <code>Node</code> and builds up
     * a JDOM tree, recursing until the DOM tree is exhausted
     * and the JDOM tree results.
     *
     * @param node <code>Code</node> to examine.
     * @param doc JDOM <code>Document</code> being built.
     * @param current <code>Element</code> that is current parent.
     * @param atRoot <code>boolean</code> indicating whether at root level.
     */
    private void buildTree(org.w3c.dom.Node node, Document doc, Element current, boolean atRoot) {
        // Recurse through the tree
        switch (node.getNodeType()) {
        case org.w3c.dom.Node.DOCUMENT_NODE:
            org.w3c.dom.NodeList nodes = node.getChildNodes();
            for (int i = 0, size = nodes.getLength(); i < size; i++) {
                buildTree(nodes.item(i), doc, current, true);
            }
            break;

        case org.w3c.dom.Node.ELEMENT_NODE:
            String nodeName = node.getNodeName();
            String prefix = NS_PREFIX_DEFAULT;
            String localName = nodeName;
            int colon = nodeName.indexOf(':');
            if (colon >= 0) {
                prefix = nodeName.substring(0, colon);
                localName = nodeName.substring(colon + 1);
            }

            // Get element's namespace
            Namespace ns = null;
            String uri = node.getNamespaceURI();
            if (uri == null) {
                ns = (current == null) ? Namespace.NO_NAMESPACE : current.getNamespace(prefix);
            } else {
                ns = Namespace.getNamespace(prefix, uri);
            }

            Element element = factory.element(localName, ns);

            if (atRoot) {
                // If at root, set as document root
                factory.setRoot(doc, element);
            } else {
                // else add to parent element
                factory.addContent(current, element);
            }

            // Add namespaces
            org.w3c.dom.NamedNodeMap attributeList = node.getAttributes();
            int attsize = attributeList.getLength();

            for (int i = 0; i < attsize; i++) {
                org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);

                String attname = att.getName();
                if (attname.startsWith(NS_PREFIX_XMLNS)) {
                    String attPrefix = NS_PREFIX_DEFAULT;
                    colon = attname.indexOf(':');
                    if (colon >= 0) {
                        attPrefix = attname.substring(colon + 1);
                    }

                    String attvalue = att.getValue();

                    Namespace declaredNS = Namespace.getNamespace(attPrefix, attvalue);

                    // Add as additional namespaces if it's different
                    // to this element's namespace (perhaps we should
                    // also have logic not to mark them as additional if
                    // it's been done already, but it probably doesn't
                    // matter)
                    if (prefix.equals(attPrefix)) {
                        // RL: note, it should also be true that uri.equals(attvalue)
                        // if not, then the parser is boken.
                        // further, declaredNS should be exactly the same as ns
                        // so the following should in fact do nothing.
                        element.setNamespace(declaredNS);
                    } else {
                        factory.addNamespaceDeclaration(element, declaredNS);
                    }
                }
            }

            // Add attributes
            for (int i = 0; i < attsize; i++) {
                org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);

                String attname = att.getName();

                if (!attname.startsWith(NS_PREFIX_XMLNS)) {
                    String attPrefix = NS_PREFIX_DEFAULT;
                    String attLocalName = attname;
                    colon = attname.indexOf(':');
                    if (colon >= 0) {
                        attPrefix = attname.substring(0, colon);
                        attLocalName = attname.substring(colon + 1);
                    }

                    String attvalue = att.getValue();

                    // Get attribute's namespace
                    Namespace attNS = null;
                    String attURI = att.getNamespaceURI();
                    if (attPrefix.isEmpty() && (attURI == null || NS_URI_DEFAULT.equals(attURI))) {
                        attNS = Namespace.NO_NAMESPACE;
                    } else {
                        // various conditions can lead here.
                        // the logical one is that we have a prefix for the
                        // attribute, and also a namespace URI.
                        // The alternative to that is in some conditions,
                        // the parser could have a 'default' or 'fixed'
                        // attribute that comes from an XSD used for
                        // validation. In that case there may not be a prefix
                        // There's also the possibility the DOM contains
                        // garbage.
                        if (attPrefix.length() > 0) {
                            // If the att has a prefix, we can assume that
                            // the DOM is valid, and we can just use the prefix.
                            // if this prefix conflicts with some other namespace
                            // then we re-declare it. If redeclaring it screws up
                            // other attributes in this Element, then the DOM
                            // was broken to start with.
                            if (attURI == null) {
                                // this can happen when the DOM is created
                                // without being namespace aware. we have a
                                // prefix, but the URI is not embedded in
                                // the Attribute itself. It must be declared
                                // on the element somewhere....
                                // https://github.com/hunterhacker/jdom/issues/138
                                attNS = element.getNamespace(attPrefix);
                            } else {
                                attNS = Namespace.getNamespace(attPrefix, attURI);
                            }
                        } else {
                            // OK, no prefix.
                            // must be a defaulted value from an XSD.
                            // perhaps we can find the namespace in our
                            // element's ancestry, and use the prefix from that.
                            HashMap<String, Namespace> tmpmap = new HashMap<String, Namespace>();
                            for (Namespace nss : element.getNamespacesInScope()) {
                                if (nss.getPrefix().length() > 0 && nss.getURI().equals(attURI)) {
                                    attNS = nss;
                                    break;
                                }
                                tmpmap.put(nss.getPrefix(), nss);
                            }
                            if (attNS == null) {
                                // we cannot find a 'prevailing' namespace that has a prefix
                                // that is for this namespace.
                                // This basically means that there's an XMLSchema, for the
                                // DEFAULT namespace, and there's a defaulted/fixed
                                // attribute definition in the XMLSchema that's targeted
                                // for this namespace,... but, the user has either not
                                // declared a prefixed version of the namespace, or has
                                // re-declared the same prefix at a lower level with a
                                // different namespace.
                                // All of these things are possible.
                                // Create some sort of default prefix.
                                int cnt = 0;
                                String base = "attns";
                                String pfx = base + cnt;
                                while (tmpmap.containsKey(pfx)) {
                                    cnt++;
                                    pfx = base + cnt;
                                }
                                attNS = Namespace.getNamespace(pfx, attURI);
                            }
                        }
                    }

                    Attribute attribute = factory.attribute(attLocalName, attvalue, attNS);
                    factory.setAttribute(element, attribute);
                }
            }

            // Recurse on child nodes
            // The list should never be null nor should it ever contain
            // null nodes, but some DOM impls are broken
            org.w3c.dom.NodeList children = node.getChildNodes();
            if (children != null) {
                int size = children.getLength();
                for (int i = 0; i < size; i++) {
                    org.w3c.dom.Node item = children.item(i);
                    if (item != null) {
                        buildTree(item, doc, element, false);
                    }
                }
            }
            break;

        case org.w3c.dom.Node.TEXT_NODE:
            factory.addContent(current, build((org.w3c.dom.Text) node));
            break;

        case org.w3c.dom.Node.CDATA_SECTION_NODE:
            factory.addContent(current, build((org.w3c.dom.CDATASection) node));
            break;

        case org.w3c.dom.Node.PROCESSING_INSTRUCTION_NODE:
            if (atRoot) {
                factory.addContent(doc, build((org.w3c.dom.ProcessingInstruction) node));
            } else {
                factory.addContent(current, build((org.w3c.dom.ProcessingInstruction) node));
            }
            break;

        case org.w3c.dom.Node.COMMENT_NODE:
            if (atRoot) {
                factory.addContent(doc, build((org.w3c.dom.Comment) node));
            } else {
                factory.addContent(current, build((org.w3c.dom.Comment) node));
            }
            break;

        case org.w3c.dom.Node.ENTITY_REFERENCE_NODE:
            factory.addContent(current, build((org.w3c.dom.EntityReference) node));
            break;

        case org.w3c.dom.Node.ENTITY_NODE:
            // ??
            break;

        case org.w3c.dom.Node.DOCUMENT_TYPE_NODE:

            factory.addContent(doc, build((org.w3c.dom.DocumentType) node));
            break;
        }
    }
}