| 1 |  |  | 
| 2 |  |  | 
| 3 |  |  | 
| 4 |  |  | 
| 5 |  |  | 
| 6 |  |  | 
| 7 |  |  | 
| 8 |  | package org.dom4j.io; | 
| 9 |  |  | 
| 10 |  | import java.util.ArrayList; | 
| 11 |  | import java.util.List; | 
| 12 |  |  | 
| 13 |  | import org.dom4j.Branch; | 
| 14 |  | import org.dom4j.Document; | 
| 15 |  | import org.dom4j.DocumentFactory; | 
| 16 |  | import org.dom4j.Element; | 
| 17 |  | import org.dom4j.Namespace; | 
| 18 |  | import org.dom4j.QName; | 
| 19 |  | import org.dom4j.tree.NamespaceStack; | 
| 20 |  |  | 
| 21 |  |  | 
| 22 |  |  | 
| 23 |  |  | 
| 24 |  |  | 
| 25 |  |  | 
| 26 |  |  | 
| 27 |  |  | 
| 28 |  |  | 
| 29 |  |  | 
| 30 |  | public class DOMReader { | 
| 31 |  |  | 
| 32 |  | private DocumentFactory factory; | 
| 33 |  |  | 
| 34 |  |  | 
| 35 |  | private NamespaceStack namespaceStack; | 
| 36 |  |  | 
| 37 | 20 | public DOMReader() { | 
| 38 | 20 | this.factory = DocumentFactory.getInstance(); | 
| 39 | 20 | this.namespaceStack = new NamespaceStack(factory); | 
| 40 |  | } | 
| 41 |  |  | 
| 42 | 0 | public DOMReader(DocumentFactory factory) { | 
| 43 | 0 | this.factory = factory; | 
| 44 | 0 | this.namespaceStack = new NamespaceStack(factory); | 
| 45 |  | } | 
| 46 |  |  | 
| 47 |  |  | 
| 48 |  |  | 
| 49 |  |  | 
| 50 |  |  | 
| 51 |  |  | 
| 52 |  |  | 
| 53 | 20 | public DocumentFactory getDocumentFactory() { | 
| 54 | 20 | return factory; | 
| 55 |  | } | 
| 56 |  |  | 
| 57 |  |  | 
| 58 |  |  | 
| 59 |  |  | 
| 60 |  |  | 
| 61 |  |  | 
| 62 |  |  | 
| 63 |  |  | 
| 64 |  |  | 
| 65 |  |  | 
| 66 |  |  | 
| 67 |  |  | 
| 68 | 0 | public void setDocumentFactory(DocumentFactory docFactory) { | 
| 69 | 0 | this.factory = docFactory; | 
| 70 | 0 | this.namespaceStack.setDocumentFactory(factory); | 
| 71 |  | } | 
| 72 |  |  | 
| 73 | 20 | public Document read(org.w3c.dom.Document domDocument) { | 
| 74 | 20 | if (domDocument instanceof Document) { | 
| 75 | 0 | return (Document) domDocument; | 
| 76 |  | } | 
| 77 |  |  | 
| 78 | 20 | Document document = createDocument(); | 
| 79 |  |  | 
| 80 | 20 | clearNamespaceStack(); | 
| 81 |  |  | 
| 82 | 20 | org.w3c.dom.NodeList nodeList = domDocument.getChildNodes(); | 
| 83 |  |  | 
| 84 | 20 | for (int i = 0, size = nodeList.getLength(); i < size; i++) { | 
| 85 | 26 | readTree(nodeList.item(i), document); | 
| 86 |  | } | 
| 87 |  |  | 
| 88 | 20 | return document; | 
| 89 |  | } | 
| 90 |  |  | 
| 91 |  |  | 
| 92 | 14094 | protected void readTree(org.w3c.dom.Node node, Branch current) { | 
| 93 | 14094 | Element element = null; | 
| 94 | 14094 | Document document = null; | 
| 95 |  |  | 
| 96 | 14094 | if (current instanceof Element) { | 
| 97 | 14068 | element = (Element) current; | 
| 98 |  | } else { | 
| 99 | 26 | document = (Document) current; | 
| 100 |  | } | 
| 101 |  |  | 
| 102 | 14094 | switch (node.getNodeType()) { | 
| 103 | 5119 | case org.w3c.dom.Node.ELEMENT_NODE: | 
| 104 | 5119 | readElement(node, current); | 
| 105 |  |  | 
| 106 | 5119 | break; | 
| 107 |  |  | 
| 108 | 2 | case org.w3c.dom.Node.PROCESSING_INSTRUCTION_NODE: | 
| 109 |  |  | 
| 110 | 2 | if (current instanceof Element) { | 
| 111 | 0 | Element currentEl = (Element) current; | 
| 112 | 0 | currentEl.addProcessingInstruction(node.getNodeName(), node | 
| 113 |  | .getNodeValue()); | 
| 114 |  | } else { | 
| 115 | 2 | Document currentDoc = (Document) current; | 
| 116 | 2 | currentDoc.addProcessingInstruction(node.getNodeName(), | 
| 117 |  | node.getNodeValue()); | 
| 118 |  | } | 
| 119 |  |  | 
| 120 | 2 | break; | 
| 121 |  |  | 
| 122 | 70 | case org.w3c.dom.Node.COMMENT_NODE: | 
| 123 |  |  | 
| 124 | 70 | if (current instanceof Element) { | 
| 125 | 66 | ((Element) current).addComment(node.getNodeValue()); | 
| 126 |  | } else { | 
| 127 | 4 | ((Document) current).addComment(node.getNodeValue()); | 
| 128 |  | } | 
| 129 |  |  | 
| 130 | 70 | break; | 
| 131 |  |  | 
| 132 | 0 | case org.w3c.dom.Node.DOCUMENT_TYPE_NODE: | 
| 133 |  |  | 
| 134 | 0 | org.w3c.dom.DocumentType domDocType | 
| 135 |  | = (org.w3c.dom.DocumentType) node; | 
| 136 | 0 | document.addDocType(domDocType.getName(), domDocType | 
| 137 |  | .getPublicId(), domDocType.getSystemId()); | 
| 138 |  |  | 
| 139 | 0 | break; | 
| 140 |  |  | 
| 141 | 8873 | case org.w3c.dom.Node.TEXT_NODE: | 
| 142 | 8873 | element.addText(node.getNodeValue()); | 
| 143 |  |  | 
| 144 | 8873 | break; | 
| 145 |  |  | 
| 146 | 30 | case org.w3c.dom.Node.CDATA_SECTION_NODE: | 
| 147 | 30 | element.addCDATA(node.getNodeValue()); | 
| 148 |  |  | 
| 149 | 30 | break; | 
| 150 |  |  | 
| 151 | 0 | case org.w3c.dom.Node.ENTITY_REFERENCE_NODE: | 
| 152 |  |  | 
| 153 |  |  | 
| 154 | 0 | org.w3c.dom.Node firstChild = node.getFirstChild(); | 
| 155 |  |  | 
| 156 | 0 | if (firstChild != null) { | 
| 157 | 0 | element.addEntity(node.getNodeName(), firstChild | 
| 158 |  | .getNodeValue()); | 
| 159 |  | } else { | 
| 160 | 0 | element.addEntity(node.getNodeName(), ""); | 
| 161 |  | } | 
| 162 |  |  | 
| 163 | 0 | break; | 
| 164 |  |  | 
| 165 | 0 | case org.w3c.dom.Node.ENTITY_NODE: | 
| 166 | 0 | element.addEntity(node.getNodeName(), node.getNodeValue()); | 
| 167 |  |  | 
| 168 | 0 | break; | 
| 169 |  |  | 
| 170 | 0 | default: | 
| 171 | 0 | System.out.println("WARNING: Unknown DOM node type: " | 
| 172 |  | + node.getNodeType()); | 
| 173 |  | } | 
| 174 |  | } | 
| 175 |  |  | 
| 176 | 5119 | protected void readElement(org.w3c.dom.Node node, Branch current) { | 
| 177 | 5119 | int previouslyDeclaredNamespaces = namespaceStack.size(); | 
| 178 |  |  | 
| 179 | 5119 | String namespaceUri = node.getNamespaceURI(); | 
| 180 | 5119 | String elementPrefix = node.getPrefix(); | 
| 181 |  |  | 
| 182 | 5119 | if (elementPrefix == null) { | 
| 183 | 4751 | elementPrefix = ""; | 
| 184 |  | } | 
| 185 |  |  | 
| 186 | 5119 | org.w3c.dom.NamedNodeMap attributeList = node.getAttributes(); | 
| 187 |  |  | 
| 188 | 5119 | if ((attributeList != null) && (namespaceUri == null)) { | 
| 189 |  |  | 
| 190 | 4686 | org.w3c.dom.Node attribute = attributeList.getNamedItem("xmlns"); | 
| 191 |  |  | 
| 192 | 4686 | if (attribute != null) { | 
| 193 | 2 | namespaceUri = attribute.getNodeValue(); | 
| 194 | 2 | elementPrefix = ""; | 
| 195 |  | } | 
| 196 |  | } | 
| 197 |  |  | 
| 198 | 5119 | QName qName = namespaceStack.getQName(namespaceUri, | 
| 199 |  | node.getLocalName(), node.getNodeName()); | 
| 200 | 5119 | Element element = current.addElement(qName); | 
| 201 |  |  | 
| 202 | 5119 | if (attributeList != null) { | 
| 203 | 5119 | int size = attributeList.getLength(); | 
| 204 | 5119 | List attributes = new ArrayList(size); | 
| 205 |  |  | 
| 206 | 5119 | for (int i = 0; i < size; i++) { | 
| 207 | 2829 | org.w3c.dom.Node attribute = attributeList.item(i); | 
| 208 |  |  | 
| 209 |  |  | 
| 210 | 2829 | String name = attribute.getNodeName(); | 
| 211 |  |  | 
| 212 | 2829 | if (name.startsWith("xmlns")) { | 
| 213 | 52 | String prefix = getPrefix(name); | 
| 214 | 52 | String uri = attribute.getNodeValue(); | 
| 215 |  |  | 
| 216 | 52 | Namespace namespace = namespaceStack.addNamespace(prefix, | 
| 217 |  | uri); | 
| 218 | 52 | element.add(namespace); | 
| 219 |  | } else { | 
| 220 | 2777 | attributes.add(attribute); | 
| 221 |  | } | 
| 222 |  | } | 
| 223 |  |  | 
| 224 |  |  | 
| 225 | 5119 | size = attributes.size(); | 
| 226 |  |  | 
| 227 | 5119 | for (int i = 0; i < size; i++) { | 
| 228 | 2777 | org.w3c.dom.Node attribute = (org.w3c.dom.Node) attributes | 
| 229 |  | .get(i); | 
| 230 | 2777 | QName attributeQName = namespaceStack.getQName(attribute | 
| 231 |  | .getNamespaceURI(), attribute.getLocalName(), attribute | 
| 232 |  | .getNodeName()); | 
| 233 | 2777 | element.addAttribute(attributeQName, attribute.getNodeValue()); | 
| 234 |  | } | 
| 235 |  | } | 
| 236 |  |  | 
| 237 |  |  | 
| 238 | 5119 | org.w3c.dom.NodeList children = node.getChildNodes(); | 
| 239 |  |  | 
| 240 | 5119 | for (int i = 0, size = children.getLength(); i < size; i++) { | 
| 241 | 14068 | org.w3c.dom.Node child = children.item(i); | 
| 242 | 14068 | readTree(child, element); | 
| 243 |  | } | 
| 244 |  |  | 
| 245 |  |  | 
| 246 | 5119 | while (namespaceStack.size() > previouslyDeclaredNamespaces) { | 
| 247 | 52 | namespaceStack.pop(); | 
| 248 |  | } | 
| 249 |  | } | 
| 250 |  |  | 
| 251 | 0 | protected Namespace getNamespace(String prefix, String uri) { | 
| 252 | 0 | return getDocumentFactory().createNamespace(prefix, uri); | 
| 253 |  | } | 
| 254 |  |  | 
| 255 | 20 | protected Document createDocument() { | 
| 256 | 20 | return getDocumentFactory().createDocument(); | 
| 257 |  | } | 
| 258 |  |  | 
| 259 | 20 | protected void clearNamespaceStack() { | 
| 260 | 20 | namespaceStack.clear(); | 
| 261 |  |  | 
| 262 | 20 | if (!namespaceStack.contains(Namespace.XML_NAMESPACE)) { | 
| 263 | 20 | namespaceStack.push(Namespace.XML_NAMESPACE); | 
| 264 |  | } | 
| 265 |  | } | 
| 266 |  |  | 
| 267 | 52 | private String getPrefix(String xmlnsDecl) { | 
| 268 | 52 | int index = xmlnsDecl.indexOf(':', 5); | 
| 269 |  |  | 
| 270 | 52 | if (index != -1) { | 
| 271 | 30 | return xmlnsDecl.substring(index + 1); | 
| 272 |  | } else { | 
| 273 | 22 | return ""; | 
| 274 |  | } | 
| 275 |  | } | 
| 276 |  | } | 
| 277 |  |  | 
| 278 |  |  | 
| 279 |  |  | 
| 280 |  |  | 
| 281 |  |  | 
| 282 |  |  | 
| 283 |  |  | 
| 284 |  |  | 
| 285 |  |  | 
| 286 |  |  | 
| 287 |  |  | 
| 288 |  |  | 
| 289 |  |  | 
| 290 |  |  | 
| 291 |  |  | 
| 292 |  |  | 
| 293 |  |  | 
| 294 |  |  | 
| 295 |  |  | 
| 296 |  |  | 
| 297 |  |  | 
| 298 |  |  | 
| 299 |  |  | 
| 300 |  |  | 
| 301 |  |  | 
| 302 |  |  | 
| 303 |  |  | 
| 304 |  |  | 
| 305 |  |  | 
| 306 |  |  | 
| 307 |  |  | 
| 308 |  |  | 
| 309 |  |  | 
| 310 |  |  | 
| 311 |  |  | 
| 312 |  |  | 
| 313 |  |  |