Java HTML / XML How to - Access different types of DOM tree nodes








Question

We would like to know how to access different types of DOM tree nodes.

Answer

import java.io.StringReader;
/*w  ww  .  j  a  va2  s  . co m*/
import javax.xml.parsers.DocumentBuilderFactory;

import org.w3c.dom.Attr;
import org.w3c.dom.Comment;
import org.w3c.dom.Document;
import org.w3c.dom.Element;
import org.w3c.dom.Node;
import org.w3c.dom.CharacterData;
import org.w3c.dom.NodeList;
import org.w3c.dom.Text;
import org.xml.sax.InputSource;

public class Main {
  public static String getXMLData() {
    return "<a><person  number='' dept=''><name>myName</name></person></a>";
  }

  public static void main(String[] argv) throws Exception {
    DocumentBuilderFactory factory = DocumentBuilderFactory.newInstance();
    Document document = factory.newDocumentBuilder().parse(
        new InputSource(new StringReader(getXMLData())));

    Element purchaseOrder = document.getDocumentElement();
    printElement(purchaseOrder, "");
  }
  static void printElement(Element element, String indent) {
    System.out.println("Element '" + element.getNodeName() + "'");
    NodeList children = element.getChildNodes();
    for (int i = 0; i < children.getLength(); i++) {
      Node child = children.item(i);
      switch (child.getNodeType()) {
      case Node.ELEMENT_NODE:
        printElement((Element) child, indent + "\t");
        break;
      case Node.ATTRIBUTE_NODE:
        Attr attr = (Attr) child;
        System.out.println("\tAttribute: '" + attr.getName() + "' = '" + attr.getValue() + "'");
        break;
      case Node.COMMENT_NODE:
        Comment comment = (Comment) child;
        System.out.println("\tComment: '" + comment.getData() + "'");
        break;
      case Node.CDATA_SECTION_NODE:
        CharacterData cdata = (CharacterData) child;
        System.out.println("\tCDatat: '" + cdata.getData() + "'");
        break;
      case Node.TEXT_NODE:
        Text text = (Text) child;
        System.out.println("\tText: '" + text.getData() + "'");
        break;
      default:
        System.out.println("\tUnknown node type: '" + child.getNodeType() + "'");
        break;
      }
    }
  }

}

The code above generates the following result.