001    /*
002     * Licensed to the Apache Software Foundation (ASF) under one
003     * or more contributor license agreements. See the NOTICE file
004     * distributed with this work for additional information
005     * regarding copyright ownership. The ASF licenses this file
006     * to you under the Apache License, Version 2.0 (the  "License");
007     * you may not use this file except in compliance with the License.
008     * You may obtain a copy of the License at
009     *
010     *     http://www.apache.org/licenses/LICENSE-2.0
011     *
012     * Unless required by applicable law or agreed to in writing, software
013     * distributed under the License is distributed on an "AS IS" BASIS,
014     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
015     * See the License for the specific language governing permissions and
016     * limitations under the License.
017     */
018    /*
019     * $Id: DTMIterator.java 468653 2006-10-28 07:07:05Z minchau $
020     */
021    package org.apache.xml.dtm;
022    
023    /**
024    
025     * <code>DTMIterators</code> are used to step through a (possibly
026     * filtered) set of nodes.  Their API is modeled largely after the DOM
027     * NodeIterator.
028     * 
029     * <p>A DTMIterator is a somewhat unusual type of iterator, in that it 
030     * can serve both single node iteration and random access.</p>
031     * 
032     * <p>The DTMIterator's traversal semantics, i.e. how it walks the tree,
033     * are specified when it is created, possibly and probably by an XPath
034     * <a href="http://www.w3.org/TR/xpath#NT-LocationPath">LocationPath</a> or 
035     * a <a href="http://www.w3.org/TR/xpath#NT-UnionExpr">UnionExpr</a>.</p>
036     * 
037     * <p>A DTMIterator is meant to be created once as a master static object, and 
038     * then cloned many times for runtime use.  Or the master object itself may 
039     * be used for simpler use cases.</p>
040     *
041     * <p>At this time, we do not expect DTMIterator to emulate
042     * NodeIterator's "maintain relative position" semantics under
043     * document mutation.  It's likely to respond more like the
044     * TreeWalker's "current node" semantics. However, since the base DTM
045     * is immutable, this issue currently makes no practical
046     * difference.</p>
047     *
048     * <p>State: In progress!!</p> */
049    public interface DTMIterator
050    {
051    
052      // Constants returned by acceptNode, borrowed from the DOM Traversal chapter
053      // %REVIEW% Should we explicitly initialize them from, eg,
054      // org.w3c.dom.traversal.NodeFilter.FILTER_ACCEPT?
055    
056      /**
057       * Accept the node.
058       */
059      public static final short FILTER_ACCEPT = 1;
060    
061      /**
062       * Reject the node. Same behavior as FILTER_SKIP. (In the DOM these
063       * differ when applied to a TreeWalker but have the same result when
064       * applied to a NodeIterator).
065       */
066      public static final short FILTER_REJECT = 2;
067    
068      /**
069       * Skip this single node. 
070       */
071      public static final short FILTER_SKIP = 3;
072        
073      /**
074       * Get an instance of a DTM that "owns" a node handle.  Since a node 
075       * iterator may be passed without a DTMManager, this allows the 
076       * caller to easily get the DTM using just the iterator.
077       *
078       * @param nodeHandle the nodeHandle.
079       *
080       * @return a non-null DTM reference.
081       */
082      public DTM getDTM(int nodeHandle);
083      
084      /**
085       * Get an instance of the DTMManager.  Since a node 
086       * iterator may be passed without a DTMManager, this allows the 
087       * caller to easily get the DTMManager using just the iterator.
088       *
089       * @return a non-null DTMManager reference.
090       */
091      public DTMManager getDTMManager();
092    
093      /**
094       * The root node of the <code>DTMIterator</code>, as specified when it
095       * was created.  Note the root node is not the root node of the 
096       * document tree, but the context node from where the iteration 
097       * begins and ends.
098       *
099       * @return The node handle of the context node.
100       */
101      public int getRoot();
102    
103      /**
104       * Reset the root node of the <code>DTMIterator</code>, overriding
105       * the value specified when it was created.  Note the root node is
106       * not the root node of the document tree, but the context node from
107       * where the iteration begins.
108       *
109       * @param nodeHandle Handle of the context node.
110       * @param environment The environment object.  
111       * The environment in which this iterator operates, which should provide:
112       * <ul>
113       * <li>a node (the context node... same value as "root" defined below) </li>
114       * <li>a pair of non-zero positive integers (the context position and the context size) </li>
115       * <li>a set of variable bindings </li>
116       * <li>a function library </li>
117       * <li>the set of namespace declarations in scope for the expression.</li>
118       * </ul>
119       * 
120       * <p>At this time the exact implementation of this environment is application 
121       * dependent.  Probably a proper interface will be created fairly soon.</p>
122       * 
123       */
124      public void setRoot(int nodeHandle, Object environment);
125      
126      /**
127       * Reset the iterator to the start. After resetting, the next node returned
128       * will be the root node -- or, if that's filtered out, the first node
129       * within the root's subtree which is _not_ skipped by the filters.
130       */
131      public void reset();
132    
133      /**
134       * This attribute determines which node types are presented via the
135       * iterator. NOTE(review): the SHOW_XXX constants are not declared in this
136       * interface (presumably in DTMFilter -- confirm). Nodes not accepted by
137       * <code>whatToShow</code> will be skipped, but their children may still
138       * be considered.
139       *
140       * @return one of the SHOW_XXX constants, or several ORed together.
141       */
142      public int getWhatToShow();
143    
144      /**
145       * <p>The value of this flag determines whether the children of entity
146       * reference nodes are visible to the iterator. If false, they and
147       * their descendants will be rejected. Note that this rejection takes
148       * precedence over <code>whatToShow</code> and the filter. </p>
149       * 
150       * <p> To produce a view of the document that has entity references
151       * expanded and does not expose the entity reference node itself, use
152       * the <code>whatToShow</code> flags to hide the entity reference node
153       * and set <code>expandEntityReferences</code> to true when creating the
154       * iterator. To produce a view of the document that has entity reference
155       * nodes but no entity expansion, use the <code>whatToShow</code> flags
156       * to show the entity reference node and set
157       * <code>expandEntityReferences</code> to false.</p>
158       *
159       * <p>NOTE: In Xalan's use of DTM we will generally have fully expanded
160       * entity references when the document tree was built, and thus this
161       * flag will have no effect.</p>
162       *
163       * @return true if entity references will be expanded.  */
164      public boolean getExpandEntityReferences();
165    
166      /**
167       * Returns the next node in the set and advances the position of the
168       * iterator in the set. After <code>setRoot</code> has been called,
169       * the first call to <code>nextNode()</code> returns that root or (if it
170       * is rejected by the filters) the first node within its subtree which is
171       * not filtered out.
172       * @return The next node handle in the set being iterated over, or
173       *  <code>DTM.NULL</code> if there are no more members in that set.
174       */
175      public int nextNode();
176    
177      /**
178       * Returns the previous node in the set and moves the position of the
179       * <code>DTMIterator</code> backwards in the set.
180       * @return The previous node handle in the set being iterated over,
181       *   or <code>DTM.NULL</code> if there are no more members in that set.
182       */
183      public int previousNode();
184    
185      /**
186       * Detaches the <code>DTMIterator</code> from the set which it iterated
187       * over, releasing any computational resources and placing the iterator
188       * in the INVALID state. After <code>detach</code> has been invoked,
189       * calls to <code>nextNode</code> or <code>previousNode</code> will
190       * raise a runtime exception.
191       */
192      public void detach();
193      
194      /**
195       * Specify if it's OK for detach to release the iterator for reuse.
196       * 
197       * @param allowRelease true if it is OK for detach to release this iterator 
198       * for pooling.
199       */
200      public void allowDetachToRelease(boolean allowRelease);
201    
202      /**
203       * Get the current node in the iterator. Note that this differs from
204       * the DOM's NodeIterator, where the current position lies between two
205       * nodes (as part of the maintain-relative-position semantic).
206       *
207       * @return The current node handle, or -1 (presumably DTM.NULL -- confirm).
208       */
209      public int getCurrentNode();
210    
211      /**
212       * Tells if this iterator is "fresh", in other words, if
213       * the first nextNode() that is called will return the
214       * first node in the set.
215       *
216       * @return true if the iteration of this list has not yet begun.
217       */
218      public boolean isFresh();
219    
220      //========= Random Access ==========
221    
222      /**
223       * If setShouldCacheNodes(true) is called, then nodes will
224       * be cached, enabling random access, and giving the ability to do 
225       * sorts and the like.  They are not cached by default.
226       *
227       * %REVIEW% Shouldn't the other random-access methods throw an exception
228       * if they're called on a DTMIterator with this flag set false?
229       *
230       * @param b true if the nodes should be cached.
231       */
232      public void setShouldCacheNodes(boolean b);
233      
234      /**
235       * Tells if this iterator can have nodes added to it or set via 
236       * the <code>setItem(int node, int index)</code> method.
237       * 
238       * @return True if the nodelist can be mutated.
239       */
240      public boolean isMutable();
241    
242      /** Get the current position within the cached list, which is one
243       * less than the next nextNode() call will retrieve.  i.e. if you
244       * call getCurrentPos() and the return is 0, the next fetch will
245       * take place at index 1.
246       *
247       * @return The position of the iteration.
248       */
249      public int getCurrentPos();
250    
251      /**
252       * Runs the iterator to the given index; NodeSetDTM calls this when an
253       * index is requested.  By default this sets m_next (an implementation
254       * field, not declared here) to the index.  If the index argument is -1, this
255       * signals that the iterator should be run to the end and
256       * completely fill the cache.
257       *
258       * @param index The index to run to, or -1 if the iterator should be run
259       *              to the end.
260       */
261      public void runTo(int index);
262    
263      /**
264       * Set the current position in the node set.
265       * 
266       * @param i Must be a valid index.
267       */
268      public void setCurrentPos(int i);
269    
270      /**
271       * Returns the <code>node handle</code> of an item in the collection. If
272       * <code>index</code> is greater than or equal to the number of nodes in
273       * the list, this returns <code>-1</code>.
274       *
275       * @param index of the item.
276       * @return The node handle at the <code>index</code>th position in the
277       *   <code>DTMIterator</code>, or <code>-1</code> if that is not a valid
278       *   index.
279       */
280      public int item(int index);
281      
282      /**
283       * Sets the node at the specified index of this node list to be the
284       * specified node. The previous component at that position is discarded.
285       *
286       * <p>The index must be a value greater than or equal to 0 and less
287       * than the current size of the node list.  
288       * The iterator must be in cached mode.</p>
289       * 
290       * <p>Meant to be used for sorted iterators.</p>
291       *
292       * @param node Node to set
293       * @param index Index of where to set the node
294       */
295      public void setItem(int node, int index);
296      
297      /**
298       * The number of nodes in the list. The range of valid child node indices
299       * is 0 to <code>length-1</code> inclusive. Note that this requires running
300       * the iterator to completion, and presumably filling the cache.
301       *
302       * @return The number of nodes in the list.
303       */
304      public int getLength();
305        
306      //=========== Cloning operations. ============
307      
308      /**
309       * Get a cloned Iterator that is reset to the start of the iteration.
310       *
311       * @return A clone of this iteration that has been reset.
312       *
313       * @throws CloneNotSupportedException if cloning is not supported.
314       */
315      public DTMIterator cloneWithReset() throws CloneNotSupportedException;
316    
317      /**
318       * Get a clone of this iterator, but don't reset the iteration in the 
319       * process, so that it may be used from the current position.
320       *
321       * @return A clone of this object.
322       *
323       * @throws CloneNotSupportedException if cloning is not supported.
324       */
325      public Object clone() throws CloneNotSupportedException;
326      
327      /**
328       * Returns true if all the nodes in the iteration will be returned in document 
329       * order.
330       * 
331       * @return true if all the nodes in the iteration will be returned in document 
332       * order.
333       */
334      public boolean isDocOrdered();
335      
336      /**
337       * Returns the axis being iterated, if it is known.
338       * 
339       * @return Axis.CHILD, etc., or -1 if the axis is not known or is of multiple 
340       * types.
341       */
342      public int getAxis();
343    
344    }