/**
 * Copyright 2008 - CommonCrawl Foundation
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
 *
 **/

package org.commoncrawl.util;

import java.util.Stack;

import org.w3c.dom.Node;
import org.w3c.dom.NodeList;

/**
 * <p>
 * A utility class that allows the walking of any DOM tree using a stack instead
 * of recursion. As the node tree is walked the next node is popped off of the
 * stack and all of its children are automatically added to the stack to be
 * called in tree order.
 * </p>
 *
 * <p>
 * Currently this class is not thread safe. It is assumed that only one thread
 * will be accessing the <code>NodeWalker</code> at any given time.
 * </p>
 */
public class NodeWalker {

  /** The node most recently returned by {@link #nextNode()}. */
  private Node currentNode;

  /** The child list of {@link #currentNode}, captured by {@link #nextNode()}. */
  private NodeList currentChildren;

  /** The nodes still to be visited; the top of the stack is visited next. */
  private final Stack<Node> nodes = new Stack<Node>();

  /**
   * Starts the <code>Node</code> tree from the root node.
   *
   * @param rootNode
   *          the node to start walking from. A <code>null</code> root is
   *          treated as an empty tree: {@link #hasNext()} is immediately
   *          false and {@link #nextNode()} returns null.
   */
  public NodeWalker(Node rootNode) {
    // Never push null: nextNode() dereferences every node it pops.
    if (rootNode != null) {
      nodes.push(rootNode);
    }
  }

  /**
   * <p>
   * Returns the next <code>Node</code> on the stack and pushes all of its
   * children onto the stack, allowing us to walk the node tree without the use
   * of recursion. If there are no more nodes on the stack then null is
   * returned.
   * </p>
   *
   * @return Node The next <code>Node</code> on the stack or null if there isn't
   *         a next node.
   */
  public Node nextNode() {

    // if no next node return null
    if (!hasNext()) {
      return null;
    }

    // pop the next node off of the stack and remember its children so that
    // skipChildren() can later recognise them
    currentNode = nodes.pop();
    currentChildren = currentNode.getChildNodes();
    int childLen = (currentChildren != null) ? currentChildren.getLength() : 0;

    // push the children last-to-first so that the first child ends up on top
    // of the stack and the children are visited in first to last order
    for (int i = childLen - 1; i >= 0; i--) {
      nodes.push(currentChildren.item(i));
    }

    return currentNode;
  }

  /**
   * <p>
   * Skips over and removes from the node stack the children of the last node.
   * When getting a next node from the walker, that node's children are
   * automatically added to the stack. You can call this method to remove those
   * children from the stack.
   * </p>
   *
   * <p>
   * This is useful when you don't want to process deeper into the current path
   * of the node tree but you want to continue processing sibling nodes.
   * </p>
   *
   * <p>
   * Calling this method when there is nothing left to skip (before the first
   * {@link #nextNode()} call, or a second time in a row) is a no-op.
   * </p>
   */
  public void skipChildren() {

    int childLen = (currentChildren != null) ? currentChildren.getLength() : 0;

    // Stop as soon as the stack is empty: peek() on an empty stack throws
    // EmptyStackException, which would otherwise happen when the children
    // have already been removed by an earlier call.
    for (int i = 0; i < childLen && !nodes.isEmpty(); i++) {
      Node child = nodes.peek();
      // only remove the top of the stack if it really is the i-th child
      if (child.equals(currentChildren.item(i))) {
        nodes.pop();
      }
    }
  }

  /**
   * Returns true if there are more nodes on the current stack.
   *
   * @return true if a subsequent call to {@link #nextNode()} would return a
   *         node, false if the walk is finished.
   */
  public boolean hasNext() {
    return !nodes.isEmpty();
  }
}