001 /*
002 * Licensed to the Apache Software Foundation (ASF) under one
003 * or more contributor license agreements. See the NOTICE file
004 * distributed with this work for additional information
005 * regarding copyright ownership. The ASF licenses this file
006 * to you under the Apache License, Version 2.0 (the "License");
007 * you may not use this file except in compliance with the License.
008 * You may obtain a copy of the License at
009 *
010 * http://www.apache.org/licenses/LICENSE-2.0
011 *
012 * Unless required by applicable law or agreed to in writing, software
013 * distributed under the License is distributed on an "AS IS" BASIS,
014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
015 * See the License for the specific language governing permissions and
016 * limitations under the License.
017 */
018 /*
019 * $Id: DTMDefaultBase.java 1225429 2011-12-29 04:44:11Z mrglavas $
020 */
021 package org.apache.xml.dtm.ref;
022
023 import org.apache.xml.dtm.*;
024 import org.apache.xml.utils.SuballocatedIntVector;
025 import org.apache.xml.utils.BoolStack;
026
027 import java.util.Vector;
028
029 import javax.xml.transform.Source;
030
031 import org.apache.xml.utils.XMLString;
032 import org.apache.xml.utils.XMLStringFactory;
033
034 import org.apache.xml.res.XMLMessages;
035 import org.apache.xml.res.XMLErrorResources;
036
037 import java.io.*; // for dumpDTM
038
039 /**
040 * The <code>DTMDefaultBase</code> class serves as a helper base for DTMs.
041 * It sets up structures for navigation and type, while leaving data
042 * management and construction to the derived classes.
043 */
044 public abstract class DTMDefaultBase implements DTM
045 {
046 static final boolean JJK_DEBUG=false;
047
048 // This constant is likely to be removed in the future. Use the
049 // getDocument() method instead of ROOTNODE to get at the root
050 // node of a DTM.
051 /** The identity of the root node. */
052 public static final int ROOTNODE = 0;
053
054 /**
055 * The number of nodes, which is also used to determine the next
056 * node index.
057 */
058 protected int m_size = 0;
059
060 /** The expanded names, one array element for each node. */
061 protected SuballocatedIntVector m_exptype;
062
063 /** First child values, one array element for each node. */
064 protected SuballocatedIntVector m_firstch;
065
066 /** Next sibling values, one array element for each node. */
067 protected SuballocatedIntVector m_nextsib;
068
069 /** Previous sibling values, one array element for each node. */
070 protected SuballocatedIntVector m_prevsib;
071
072 /** Parent values, one array element for each node. */
073 protected SuballocatedIntVector m_parent;
074
075 /** Vector of SuballocatedIntVectors of NS decl sets */
076 protected Vector m_namespaceDeclSets = null;
077
078 /** SuballocatedIntVector of elements at which corresponding
079 * namespaceDeclSets were defined */
080 protected SuballocatedIntVector m_namespaceDeclSetElements = null;
081
082 /**
083 * These hold indexes to elements based on namespace and local name.
084 * The base lookup is the namespace. The second lookup is the local
085 * name, and the last array contains the index of its first free slot
086 * at the start, followed by the list of element handles.
087 */
088 protected int[][][] m_elemIndexes;
089
090 /** The default block size of the node arrays */
091 public static final int DEFAULT_BLOCKSIZE = 512; // favor small docs.
092
093 /** The number of blocks for the node arrays */
094 public static final int DEFAULT_NUMBLOCKS = 32;
095
096 /** The number of blocks used for small documents & RTFs */
097 public static final int DEFAULT_NUMBLOCKS_SMALL = 4;
098
099 /** The block size of the node arrays */
100 //protected final int m_blocksize;
101
102 /**
103 * The value to use when the information has not been built yet.
104 */
105 protected static final int NOTPROCESSED = DTM.NULL - 1;
106
107 /**
108 * The DTM manager who "owns" this DTM.
109 */
110
111 public DTMManager m_mgr;
112
113 /**
114 * m_mgr cast to DTMManagerDefault, or null if it isn't an instance
115 * (Efficiency hook)
116 */
117 protected DTMManagerDefault m_mgrDefault=null;
118
119
120 /** The document identity number(s). If we have overflowed the addressing
121 * range of the first that was assigned to us, we may add others. */
122 protected SuballocatedIntVector m_dtmIdent;
123
124 /** The mask for the identity.
125 %REVIEW% Should this really be set to the _DEFAULT? What if
126 a particular DTM wanted to use another value? */
127 //protected final static int m_mask = DTMManager.IDENT_NODE_DEFAULT;
128
129 /** The base URI for this document. */
130 protected String m_documentBaseURI;
131
132 /**
133 * The whitespace filter that enables elements to strip whitespace or not.
134 */
135 protected DTMWSFilter m_wsfilter;
136
137 /** Flag indicating whether to strip whitespace nodes */
138 protected boolean m_shouldStripWS = false;
139
140 /** Stack of flags indicating whether to strip whitespace nodes */
141 protected BoolStack m_shouldStripWhitespaceStack;
142
143 /** The XMLString factory for creating XMLStrings. */
144 protected XMLStringFactory m_xstrf;
145
146 /**
147 * The table for expandedNameID lookups. This may or may not be the same
148 * table as is contained in the DTMManagerDefault.
149 */
150 protected ExpandedNameTable m_expandedNameTable;
151
152 /** true if indexing is turned on. */
153 protected boolean m_indexing;
154
/**
 * Creates a DTMDefaultBase with the standard settings: the default block
 * size ({@link #DEFAULT_BLOCKSIZE}), a previous-sibling array, and the
 * <code>newNameTable</code> flag left off. All work is delegated to the
 * nine-argument constructor.
 *
 * @param mgr The DTMManager who owns this DTM.
 * @param source The object that is used to specify the construction source.
 * @param dtmIdentity The DTM identity ID for this DTM.
 * @param whiteSpaceFilter The white space filter for this DTM, which may
 *                         be null.
 * @param xstringfactory The factory to use for creating XMLStrings.
 * @param doIndexing true if the caller considers it worth it to use
 *                   indexing schemes.
 */
public DTMDefaultBase(DTMManager mgr, Source source, int dtmIdentity,
                      DTMWSFilter whiteSpaceFilter,
                      XMLStringFactory xstringfactory, boolean doIndexing)
{
  this(mgr,
       source,
       dtmIdentity,
       whiteSpaceFilter,
       xstringfactory,
       doIndexing,
       DEFAULT_BLOCKSIZE, // blocksize
       true,              // usePrevsib
       false);            // newNameTable
}
174
/**
 * Construct a DTMDefaultBase object, allocating the per-node arrays and
 * recording the owning manager, base URI, identity and filters.
 *
 * <p>When <code>doIndexing</code> is true this DTM gets its own
 * ExpandedNameTable; otherwise the table is requested from the owning
 * DTMManagerDefault. If the manager is not a DTMManagerDefault there is no
 * manager table to ask for, so a private table is created instead of
 * failing with a NullPointerException.</p>
 *
 * @param mgr The DTMManager who owns this DTM.
 * @param source The object that is used to specify the construction source;
 *               when non-null its system ID becomes the document base URI.
 * @param dtmIdentity The DTM identity ID for this DTM.
 * @param whiteSpaceFilter The white space filter for this DTM, which may
 *                         be null.
 * @param xstringfactory The factory to use for creating XMLStrings.
 * @param doIndexing true if the caller considers it worth it to use
 *                   indexing schemes.
 * @param blocksize The block size of the DTM. A value of 64 or less also
 *                  selects the smaller block count for the node arrays.
 * @param usePrevsib true if we want to build the previous sibling node array.
 * @param newNameTable true if we want to use a new ExpandedNameTable for
 *                     this DTM. NOTE(review): this constructor does not
 *                     currently read this flag.
 */
public DTMDefaultBase(DTMManager mgr, Source source, int dtmIdentity,
                      DTMWSFilter whiteSpaceFilter,
                      XMLStringFactory xstringfactory, boolean doIndexing,
                      int blocksize, boolean usePrevsib,
                      boolean newNameTable)
{
  // Use smaller sizes for the internal node arrays if the block size
  // is small.
  int numblocks;
  if (blocksize <= 64)
  {
    numblocks = DEFAULT_NUMBLOCKS_SMALL;
    m_dtmIdent = new SuballocatedIntVector(4, 1);
  }
  else
  {
    numblocks = DEFAULT_NUMBLOCKS;
    m_dtmIdent = new SuballocatedIntVector(32);
  }

  m_exptype = new SuballocatedIntVector(blocksize, numblocks);
  m_firstch = new SuballocatedIntVector(blocksize, numblocks);
  m_nextsib = new SuballocatedIntVector(blocksize, numblocks);
  m_parent = new SuballocatedIntVector(blocksize, numblocks);

  // Only create the m_prevsib array if the usePrevsib flag is true.
  // Some DTM implementations (e.g. SAXImpl) do not need this array.
  // We can save the time to build it in those cases.
  if (usePrevsib)
    m_prevsib = new SuballocatedIntVector(blocksize, numblocks);

  m_mgr = mgr;
  if (mgr instanceof DTMManagerDefault)
    m_mgrDefault = (DTMManagerDefault) mgr;

  m_documentBaseURI = (null != source) ? source.getSystemId() : null;
  m_dtmIdent.setElementAt(dtmIdentity, 0);
  m_wsfilter = whiteSpaceFilter;
  m_xstrf = xstringfactory;
  m_indexing = doIndexing;

  if (doIndexing || null == m_mgrDefault)
  {
    // Either the caller asked for indexing, or the manager is not a
    // DTMManagerDefault and therefore has no table we can ask for.
    m_expandedNameTable = new ExpandedNameTable();
  }
  else
  {
    m_expandedNameTable = m_mgrDefault.getExpandedNameTable(this);
  }

  if (null != whiteSpaceFilter)
  {
    m_shouldStripWhitespaceStack = new BoolStack();

    pushShouldStripWhitespace(false);
  }
}
249
250 /**
251 * Ensure that the size of the element indexes can hold the information.
252 *
253 * @param namespaceID Namespace ID index.
254 * @param LocalNameID Local name ID.
255 */
256 protected void ensureSizeOfIndex(int namespaceID, int LocalNameID)
257 {
258
259 if (null == m_elemIndexes)
260 {
261 m_elemIndexes = new int[namespaceID + 20][][];
262 }
263 else if (m_elemIndexes.length <= namespaceID)
264 {
265 int[][][] indexes = m_elemIndexes;
266
267 m_elemIndexes = new int[namespaceID + 20][][];
268
269 System.arraycopy(indexes, 0, m_elemIndexes, 0, indexes.length);
270 }
271
272 int[][] localNameIndex = m_elemIndexes[namespaceID];
273
274 if (null == localNameIndex)
275 {
276 localNameIndex = new int[LocalNameID + 100][];
277 m_elemIndexes[namespaceID] = localNameIndex;
278 }
279 else if (localNameIndex.length <= LocalNameID)
280 {
281 int[][] indexes = localNameIndex;
282
283 localNameIndex = new int[LocalNameID + 100][];
284
285 System.arraycopy(indexes, 0, localNameIndex, 0, indexes.length);
286
287 m_elemIndexes[namespaceID] = localNameIndex;
288 }
289
290 int[] elemHandles = localNameIndex[LocalNameID];
291
292 if (null == elemHandles)
293 {
294 elemHandles = new int[128];
295 localNameIndex[LocalNameID] = elemHandles;
296 elemHandles[0] = 1;
297 }
298 else if (elemHandles.length <= elemHandles[0] + 1)
299 {
300 int[] indexes = elemHandles;
301
302 elemHandles = new int[elemHandles[0] + 1024];
303
304 System.arraycopy(indexes, 0, elemHandles, 0, indexes.length);
305
306 localNameIndex[LocalNameID] = elemHandles;
307 }
308 }
309
310 /**
311 * Add a node to the element indexes. The node will not be added unless
312 * it's an element.
313 *
314 * @param expandedTypeID The expanded type ID of the node.
315 * @param identity The node identity index.
316 */
317 protected void indexNode(int expandedTypeID, int identity)
318 {
319
320 ExpandedNameTable ent = m_expandedNameTable;
321 short type = ent.getType(expandedTypeID);
322
323 if (DTM.ELEMENT_NODE == type)
324 {
325 int namespaceID = ent.getNamespaceID(expandedTypeID);
326 int localNameID = ent.getLocalNameID(expandedTypeID);
327
328 ensureSizeOfIndex(namespaceID, localNameID);
329
330 int[] index = m_elemIndexes[namespaceID][localNameID];
331
332 index[index[0]] = identity;
333
334 index[0]++;
335 }
336 }
337
338 /**
339 * Find the first index that occurs in the list that is greater than or
340 * equal to the given value.
341 *
342 * @param list A list of integers.
343 * @param start The start index to begin the search.
344 * @param len The number of items to search.
345 * @param value Find the slot that has a value that is greater than or
346 * identical to this argument.
347 *
348 * @return The index in the list of the slot that is higher or identical
349 * to the identity argument, or -1 if no node is higher or equal.
350 */
351 protected int findGTE(int[] list, int start, int len, int value)
352 {
353
354 int low = start;
355 int high = start + (len - 1);
356 int end = high;
357
358 while (low <= high)
359 {
360 int mid = (low + high) >>> 1;
361 int c = list[mid];
362
363 if (c > value)
364 high = mid - 1;
365 else if (c < value)
366 low = mid + 1;
367 else
368 return mid;
369 }
370
371 return (low <= end && list[low] > value) ? low : -1;
372 }
373
374 /**
375 * Find the first matching element from the index at or after the
376 * given node.
377 *
378 * @param nsIndex The namespace index lookup.
379 * @param lnIndex The local name index lookup.
380 * @param firstPotential The first potential match that is worth looking at.
381 *
382 * @return The first node that is greater than or equal to the
383 * firstPotential argument, or DTM.NOTPROCESSED if not found.
384 */
385 int findElementFromIndex(int nsIndex, int lnIndex, int firstPotential)
386 {
387
388 int[][][] indexes = m_elemIndexes;
389
390 if (null != indexes && nsIndex < indexes.length)
391 {
392 int[][] lnIndexs = indexes[nsIndex];
393
394 if (null != lnIndexs && lnIndex < lnIndexs.length)
395 {
396 int[] elems = lnIndexs[lnIndex];
397
398 if (null != elems)
399 {
400 int pos = findGTE(elems, 1, elems[0], firstPotential);
401
402 if (pos > -1)
403 {
404 return elems[pos];
405 }
406 }
407 }
408 }
409
410 return NOTPROCESSED;
411 }
412
413 /**
414 * Get the next node identity value in the list, and call the iterator
415 * if it hasn't been added yet.
416 *
417 * @param identity The node identity (index).
418 * @return identity+1, or DTM.NULL.
419 */
420 protected abstract int getNextNodeIdentity(int identity);
421
422 /**
423 * This method should try and build one or more nodes in the table.
424 *
425 * @return true if a next node is found, or false if
426 * there are no more nodes.
427 */
428 protected abstract boolean nextNode();
429
430 /**
431 * Get the number of nodes that have been added.
432 *
433 * @return the number of nodes that have been mapped.
434 */
435 protected abstract int getNumberOfNodes();
436
437 /** Stateless axis traversers, lazily built. */
438 protected DTMAxisTraverser[] m_traversers;
439
440 // /**
441 // * Ensure that the size of the information arrays can hold another entry
442 // * at the given index.
443 // *
444 // * @param index On exit from this function, the information arrays sizes must be
445 // * at least index+1.
446 // */
447 // protected void ensureSize(int index)
448 // {
449 // // We've cut over to Suballocated*Vector, which are self-sizing.
450 // }
451
452 /**
453 * Get the simple type ID for the given node identity.
454 *
455 * @param identity The node identity.
456 *
457 * @return The simple type ID, or DTM.NULL.
458 */
459 protected short _type(int identity)
460 {
461
462 int info = _exptype(identity);
463
464 if (NULL != info)
465 return m_expandedNameTable.getType(info);
466 else
467 return NULL;
468 }
469
470 /**
471 * Get the expanded type ID for the given node identity.
472 *
473 * @param identity The node identity.
474 *
475 * @return The expanded type ID, or DTM.NULL.
476 */
477 protected int _exptype(int identity)
478 {
479 if (identity == DTM.NULL)
480 return NULL;
481 // Reorganized test and loop into single flow
482 // Tiny performance improvement, saves a few bytes of code, clearer.
483 // %OPT% Other internal getters could be treated simliarly
484 while (identity>=m_size)
485 {
486 if (!nextNode() && identity >= m_size)
487 return NULL;
488 }
489 return m_exptype.elementAt(identity);
490
491 }
492
493 /**
494 * Get the level in the tree for the given node identity.
495 *
496 * @param identity The node identity.
497 *
498 * @return The tree level, or DTM.NULL.
499 */
500 protected int _level(int identity)
501 {
502 while (identity>=m_size)
503 {
504 boolean isMore = nextNode();
505 if (!isMore && identity >= m_size)
506 return NULL;
507 }
508
509 int i=0;
510 while(NULL != (identity=_parent(identity)))
511 ++i;
512 return i;
513 }
514
515 /**
516 * Get the first child for the given node identity.
517 *
518 * @param identity The node identity.
519 *
520 * @return The first child identity, or DTM.NULL.
521 */
522 protected int _firstch(int identity)
523 {
524
525 // Boiler-plate code for each of the _xxx functions, except for the array.
526 int info = (identity >= m_size) ? NOTPROCESSED : m_firstch.elementAt(identity);
527
528 // Check to see if the information requested has been processed, and,
529 // if not, advance the iterator until we the information has been
530 // processed.
531 while (info == NOTPROCESSED)
532 {
533 boolean isMore = nextNode();
534
535 if (identity >= m_size &&!isMore)
536 return NULL;
537 else
538 {
539 info = m_firstch.elementAt(identity);
540 if(info == NOTPROCESSED && !isMore)
541 return NULL;
542 }
543 }
544
545 return info;
546 }
547
548 /**
549 * Get the next sibling for the given node identity.
550 *
551 * @param identity The node identity.
552 *
553 * @return The next sibling identity, or DTM.NULL.
554 */
555 protected int _nextsib(int identity)
556 {
557 // Boiler-plate code for each of the _xxx functions, except for the array.
558 int info = (identity >= m_size) ? NOTPROCESSED : m_nextsib.elementAt(identity);
559
560 // Check to see if the information requested has been processed, and,
561 // if not, advance the iterator until we the information has been
562 // processed.
563 while (info == NOTPROCESSED)
564 {
565 boolean isMore = nextNode();
566
567 if (identity >= m_size &&!isMore)
568 return NULL;
569 else
570 {
571 info = m_nextsib.elementAt(identity);
572 if(info == NOTPROCESSED && !isMore)
573 return NULL;
574 }
575 }
576
577 return info;
578 }
579
580 /**
581 * Get the previous sibling for the given node identity.
582 *
583 * @param identity The node identity.
584 *
585 * @return The previous sibling identity, or DTM.NULL.
586 */
587 protected int _prevsib(int identity)
588 {
589
590 if (identity < m_size)
591 return m_prevsib.elementAt(identity);
592
593 // Check to see if the information requested has been processed, and,
594 // if not, advance the iterator until we the information has been
595 // processed.
596 while (true)
597 {
598 boolean isMore = nextNode();
599
600 if (identity >= m_size && !isMore)
601 return NULL;
602 else if (identity < m_size)
603 return m_prevsib.elementAt(identity);
604 }
605 }
606
607 /**
608 * Get the parent for the given node identity.
609 *
610 * @param identity The node identity.
611 *
612 * @return The parent identity, or DTM.NULL.
613 */
614 protected int _parent(int identity)
615 {
616
617 if (identity < m_size)
618 return m_parent.elementAt(identity);
619
620 // Check to see if the information requested has been processed, and,
621 // if not, advance the iterator until we the information has been
622 // processed.
623 while (true)
624 {
625 boolean isMore = nextNode();
626
627 if (identity >= m_size && !isMore)
628 return NULL;
629 else if (identity < m_size)
630 return m_parent.elementAt(identity);
631 }
632 }
633
634 /**
635 * Diagnostics function to dump the DTM.
636 */
637 public void dumpDTM(OutputStream os)
638 {
639 try
640 {
641 if(os==null)
642 {
643 File f = new File("DTMDump"+((Object)this).hashCode()+".txt");
644 System.err.println("Dumping... "+f.getAbsolutePath());
645 os=new FileOutputStream(f);
646 }
647 PrintStream ps = new PrintStream(os);
648
649 while (nextNode()){}
650
651 int nRecords = m_size;
652
653 ps.println("Total nodes: " + nRecords);
654
655 for (int index = 0; index < nRecords; ++index)
656 {
657 int i=makeNodeHandle(index);
658 ps.println("=========== index=" + index + " handle=" + i + " ===========");
659 ps.println("NodeName: " + getNodeName(i));
660 ps.println("NodeNameX: " + getNodeNameX(i));
661 ps.println("LocalName: " + getLocalName(i));
662 ps.println("NamespaceURI: " + getNamespaceURI(i));
663 ps.println("Prefix: " + getPrefix(i));
664
665 int exTypeID = _exptype(index);
666
667 ps.println("Expanded Type ID: "
668 + Integer.toHexString(exTypeID));
669
670 int type = _type(index);
671 String typestring;
672
673 switch (type)
674 {
675 case DTM.ATTRIBUTE_NODE :
676 typestring = "ATTRIBUTE_NODE";
677 break;
678 case DTM.CDATA_SECTION_NODE :
679 typestring = "CDATA_SECTION_NODE";
680 break;
681 case DTM.COMMENT_NODE :
682 typestring = "COMMENT_NODE";
683 break;
684 case DTM.DOCUMENT_FRAGMENT_NODE :
685 typestring = "DOCUMENT_FRAGMENT_NODE";
686 break;
687 case DTM.DOCUMENT_NODE :
688 typestring = "DOCUMENT_NODE";
689 break;
690 case DTM.DOCUMENT_TYPE_NODE :
691 typestring = "DOCUMENT_NODE";
692 break;
693 case DTM.ELEMENT_NODE :
694 typestring = "ELEMENT_NODE";
695 break;
696 case DTM.ENTITY_NODE :
697 typestring = "ENTITY_NODE";
698 break;
699 case DTM.ENTITY_REFERENCE_NODE :
700 typestring = "ENTITY_REFERENCE_NODE";
701 break;
702 case DTM.NAMESPACE_NODE :
703 typestring = "NAMESPACE_NODE";
704 break;
705 case DTM.NOTATION_NODE :
706 typestring = "NOTATION_NODE";
707 break;
708 case DTM.NULL :
709 typestring = "NULL";
710 break;
711 case DTM.PROCESSING_INSTRUCTION_NODE :
712 typestring = "PROCESSING_INSTRUCTION_NODE";
713 break;
714 case DTM.TEXT_NODE :
715 typestring = "TEXT_NODE";
716 break;
717 default :
718 typestring = "Unknown!";
719 break;
720 }
721
722 ps.println("Type: " + typestring);
723
724 int firstChild = _firstch(index);
725
726 if (DTM.NULL == firstChild)
727 ps.println("First child: DTM.NULL");
728 else if (NOTPROCESSED == firstChild)
729 ps.println("First child: NOTPROCESSED");
730 else
731 ps.println("First child: " + firstChild);
732
733 if (m_prevsib != null)
734 {
735 int prevSibling = _prevsib(index);
736
737 if (DTM.NULL == prevSibling)
738 ps.println("Prev sibling: DTM.NULL");
739 else if (NOTPROCESSED == prevSibling)
740 ps.println("Prev sibling: NOTPROCESSED");
741 else
742 ps.println("Prev sibling: " + prevSibling);
743 }
744
745 int nextSibling = _nextsib(index);
746
747 if (DTM.NULL == nextSibling)
748 ps.println("Next sibling: DTM.NULL");
749 else if (NOTPROCESSED == nextSibling)
750 ps.println("Next sibling: NOTPROCESSED");
751 else
752 ps.println("Next sibling: " + nextSibling);
753
754 int parent = _parent(index);
755
756 if (DTM.NULL == parent)
757 ps.println("Parent: DTM.NULL");
758 else if (NOTPROCESSED == parent)
759 ps.println("Parent: NOTPROCESSED");
760 else
761 ps.println("Parent: " + parent);
762
763 int level = _level(index);
764
765 ps.println("Level: " + level);
766 ps.println("Node Value: " + getNodeValue(i));
767 ps.println("String Value: " + getStringValue(i));
768 }
769 }
770 catch(IOException ioe)
771 {
772 ioe.printStackTrace(System.err);
773 throw new RuntimeException(ioe.getMessage());
774 }
775 }
776
777 /**
778 * Diagnostics function to dump a single node.
779 *
780 * %REVIEW% KNOWN GLITCH: If you pass it a node index rather than a
781 * node handle, it works just fine... but the displayed identity
782 * number before the colon is different, which complicates comparing
783 * it with nodes printed the other way. We could always OR the DTM ID
784 * into the value, to suppress that distinction...
785 *
786 * %REVIEW% This might want to be moved up to DTMDefaultBase, or possibly
787 * DTM itself, since it's a useful diagnostic and uses only DTM's public
788 * APIs.
789 */
790 public String dumpNode(int nodeHandle)
791 {
792 if(nodeHandle==DTM.NULL)
793 return "[null]";
794
795 String typestring;
796 switch (getNodeType(nodeHandle))
797 {
798 case DTM.ATTRIBUTE_NODE :
799 typestring = "ATTR";
800 break;
801 case DTM.CDATA_SECTION_NODE :
802 typestring = "CDATA";
803 break;
804 case DTM.COMMENT_NODE :
805 typestring = "COMMENT";
806 break;
807 case DTM.DOCUMENT_FRAGMENT_NODE :
808 typestring = "DOC_FRAG";
809 break;
810 case DTM.DOCUMENT_NODE :
811 typestring = "DOC";
812 break;
813 case DTM.DOCUMENT_TYPE_NODE :
814 typestring = "DOC_TYPE";
815 break;
816 case DTM.ELEMENT_NODE :
817 typestring = "ELEMENT";
818 break;
819 case DTM.ENTITY_NODE :
820 typestring = "ENTITY";
821 break;
822 case DTM.ENTITY_REFERENCE_NODE :
823 typestring = "ENT_REF";
824 break;
825 case DTM.NAMESPACE_NODE :
826 typestring = "NAMESPACE";
827 break;
828 case DTM.NOTATION_NODE :
829 typestring = "NOTATION";
830 break;
831 case DTM.NULL :
832 typestring = "null";
833 break;
834 case DTM.PROCESSING_INSTRUCTION_NODE :
835 typestring = "PI";
836 break;
837 case DTM.TEXT_NODE :
838 typestring = "TEXT";
839 break;
840 default :
841 typestring = "Unknown!";
842 break;
843 }
844
845 StringBuffer sb=new StringBuffer();
846 sb.append("["+nodeHandle+": "+typestring+
847 "(0x"+Integer.toHexString(getExpandedTypeID(nodeHandle))+") "+
848 getNodeNameX(nodeHandle)+" {"+getNamespaceURI(nodeHandle)+"}"+
849 "=\""+ getNodeValue(nodeHandle)+"\"]");
850 return sb.toString();
851 }
852
853 // ========= DTM Implementation Control Functions. ==============
854
855 /**
856 * Set an implementation dependent feature.
857 * <p>
858 * %REVIEW% Do we really expect to set features on DTMs?
859 *
860 * @param featureId A feature URL.
861 * @param state true if this feature should be on, false otherwise.
862 */
863 public void setFeature(String featureId, boolean state){}
864
865 // ========= Document Navigation Functions =========
866
867 /**
868 * Given a node handle, test if it has child nodes.
869 * <p> %REVIEW% This is obviously useful at the DOM layer, where it
870 * would permit testing this without having to create a proxy
871 * node. It's less useful in the DTM API, where
872 * (dtm.getFirstChild(nodeHandle)!=DTM.NULL) is just as fast and
873 * almost as self-evident. But it's a convenience, and eases porting
874 * of DOM code to DTM. </p>
875 *
876 * @param nodeHandle int Handle of the node.
877 * @return int true if the given node has child nodes.
878 */
879 public boolean hasChildNodes(int nodeHandle)
880 {
881
882 int identity = makeNodeIdentity(nodeHandle);
883 int firstChild = _firstch(identity);
884
885 return firstChild != DTM.NULL;
886 }
887
888 /** Given a node identity, return a node handle. If extended addressing
889 * has been used (multiple DTM IDs), we need to map the high bits of the
890 * identity into the proper DTM ID.
891 *
892 * This has been made FINAL to facilitate inlining, since we do not expect
893 * any subclass of DTMDefaultBase to ever change the algorithm. (I don't
894 * really like doing so, and would love to have an excuse not to...)
895 *
896 * %REVIEW% Is it worth trying to specialcase small documents?
897 * %REVIEW% Should this be exposed at the package/public layers?
898 *
899 * @param nodeIdentity Internal offset to this node's records.
900 * @return NodeHandle (external representation of node)
901 * */
902 final public int makeNodeHandle(int nodeIdentity)
903 {
904 if(NULL==nodeIdentity) return NULL;
905
906 if(JJK_DEBUG && nodeIdentity>DTMManager.IDENT_NODE_DEFAULT)
907 System.err.println("GONK! (only useful in limited situations)");
908
909 return m_dtmIdent.elementAt(nodeIdentity >>> DTMManager.IDENT_DTM_NODE_BITS)
910 + (nodeIdentity & DTMManager.IDENT_NODE_DEFAULT) ;
911 }
912
913 /** Given a node handle, return a node identity. If extended addressing
914 * has been used (multiple DTM IDs), we need to map the high bits of the
915 * identity into the proper DTM ID and thence find the proper offset
916 * to add to the low bits of the identity
917 *
918 * This has been made FINAL to facilitate inlining, since we do not expect
919 * any subclass of DTMDefaultBase to ever change the algorithm. (I don't
920 * really like doing so, and would love to have an excuse not to...)
921 *
922 * %OPT% Performance is critical for this operation.
923 *
924 * %REVIEW% Should this be exposed at the package/public layers?
925 *
926 * @param nodeHandle (external representation of node)
927 * @return nodeIdentity Internal offset to this node's records.
928 * */
929 final public int makeNodeIdentity(int nodeHandle)
930 {
931 if(NULL==nodeHandle) return NULL;
932
933 if(m_mgrDefault!=null)
934 {
935 // Optimization: use the DTMManagerDefault's fast DTMID-to-offsets
936 // table. I'm not wild about this solution but this operation
937 // needs need extreme speed.
938
939 int whichDTMindex=nodeHandle>>>DTMManager.IDENT_DTM_NODE_BITS;
940
941 // %REVIEW% Wish I didn't have to perform the pre-test, but
942 // someone is apparently asking DTMs whether they contain nodes
943 // which really don't belong to them. That's probably a bug
944 // which should be fixed, but until it is:
945 if(m_mgrDefault.m_dtms[whichDTMindex]!=this)
946 return NULL;
947 else
948 return
949 m_mgrDefault.m_dtm_offsets[whichDTMindex]
950 | (nodeHandle & DTMManager.IDENT_NODE_DEFAULT);
951 }
952
953 int whichDTMid=m_dtmIdent.indexOf(nodeHandle & DTMManager.IDENT_DTM_DEFAULT);
954 return (whichDTMid==NULL)
955 ? NULL
956 : (whichDTMid << DTMManager.IDENT_DTM_NODE_BITS)
957 + (nodeHandle & DTMManager.IDENT_NODE_DEFAULT);
958 }
959
960
961 /**
962 * Given a node handle, get the handle of the node's first child.
963 * If not yet resolved, waits for more nodes to be added to the document and
964 * tries again.
965 *
966 * @param nodeHandle int Handle of the node.
967 * @return int DTM node-number of first child, or DTM.NULL to indicate none exists.
968 */
969 public int getFirstChild(int nodeHandle)
970 {
971
972 int identity = makeNodeIdentity(nodeHandle);
973 int firstChild = _firstch(identity);
974
975 return makeNodeHandle(firstChild);
976 }
977
978 /**
979 * Given a node handle, get the handle of the node's first child.
980 * If not yet resolved, waits for more nodes to be added to the document and
981 * tries again.
982 *
983 * @param nodeHandle int Handle of the node.
984 * @return int DTM node-number of first child, or DTM.NULL to indicate none exists.
985 */
986 public int getTypedFirstChild(int nodeHandle, int nodeType)
987 {
988
989 int firstChild, eType;
990 if (nodeType < DTM.NTYPES) {
991 for (firstChild = _firstch(makeNodeIdentity(nodeHandle));
992 firstChild != DTM.NULL;
993 firstChild = _nextsib(firstChild)) {
994 eType = _exptype(firstChild);
995 if (eType == nodeType
996 || (eType >= DTM.NTYPES
997 && m_expandedNameTable.getType(eType) == nodeType)) {
998 return makeNodeHandle(firstChild);
999 }
1000 }
1001 } else {
1002 for (firstChild = _firstch(makeNodeIdentity(nodeHandle));
1003 firstChild != DTM.NULL;
1004 firstChild = _nextsib(firstChild)) {
1005 if (_exptype(firstChild) == nodeType) {
1006 return makeNodeHandle(firstChild);
1007 }
1008 }
1009 }
1010 return DTM.NULL;
1011 }
1012
1013 /**
1014 * Given a node handle, advance to its last child.
1015 * If not yet resolved, waits for more nodes to be added to the document and
1016 * tries again.
1017 *
1018 * @param nodeHandle int Handle of the node.
1019 * @return int Node-number of last child,
1020 * or DTM.NULL to indicate none exists.
1021 */
1022 public int getLastChild(int nodeHandle)
1023 {
1024
1025 int identity = makeNodeIdentity(nodeHandle);
1026 int child = _firstch(identity);
1027 int lastChild = DTM.NULL;
1028
1029 while (child != DTM.NULL)
1030 {
1031 lastChild = child;
1032 child = _nextsib(child);
1033 }
1034
1035 return makeNodeHandle(lastChild);
1036 }
1037
1038 /**
1039 * Retrieves an attribute node by qualified name and namespace URI.
1040 *
1041 * @param nodeHandle int Handle of the node upon which to look up this attribute.
1042 * @param namespaceURI The namespace URI of the attribute to
1043 * retrieve, or null.
1044 * @param name The local name of the attribute to
1045 * retrieve.
1046 * @return The attribute node handle with the specified name (
1047 * <code>nodeName</code>) or <code>DTM.NULL</code> if there is no such
1048 * attribute.
1049 */
1050 public abstract int getAttributeNode(int nodeHandle, String namespaceURI,
1051 String name);
1052
1053 /**
1054 * Given a node handle, get the index of the node's first attribute.
1055 *
1056 * @param nodeHandle int Handle of the node.
1057 * @return Handle of first attribute, or DTM.NULL to indicate none exists.
1058 */
1059 public int getFirstAttribute(int nodeHandle)
1060 {
1061 int nodeID = makeNodeIdentity(nodeHandle);
1062
1063 return makeNodeHandle(getFirstAttributeIdentity(nodeID));
1064 }
1065
1066 /**
1067 * Given a node identity, get the index of the node's first attribute.
1068 *
1069 * @param identity int identity of the node.
1070 * @return Identity of first attribute, or DTM.NULL to indicate none exists.
1071 */
1072 protected int getFirstAttributeIdentity(int identity) {
1073 int type = _type(identity);
1074
1075 if (DTM.ELEMENT_NODE == type)
1076 {
1077 // Assume that attributes and namespaces immediately follow the element.
1078 while (DTM.NULL != (identity = getNextNodeIdentity(identity)))
1079 {
1080
1081 // Assume this can not be null.
1082 type = _type(identity);
1083
1084 if (type == DTM.ATTRIBUTE_NODE)
1085 {
1086 return identity;
1087 }
1088 else if (DTM.NAMESPACE_NODE != type)
1089 {
1090 break;
1091 }
1092 }
1093 }
1094
1095 return DTM.NULL;
1096 }
1097
1098 /**
1099 * Given a node handle and an expanded type ID, get the index of the node's
1100 * attribute of that type, if any.
1101 *
1102 * @param nodeHandle int Handle of the node.
1103 * @param attType int expanded type ID of the required attribute.
1104 * @return Handle of attribute of the required type, or DTM.NULL to indicate
1105 * none exists.
1106 */
1107 protected int getTypedAttribute(int nodeHandle, int attType) {
1108 int type = getNodeType(nodeHandle);
1109 if (DTM.ELEMENT_NODE == type) {
1110 int identity = makeNodeIdentity(nodeHandle);
1111
1112 while (DTM.NULL != (identity = getNextNodeIdentity(identity)))
1113 {
1114 type = _type(identity);
1115
1116 if (type == DTM.ATTRIBUTE_NODE)
1117 {
1118 if (_exptype(identity) == attType) return makeNodeHandle(identity);
1119 }
1120 else if (DTM.NAMESPACE_NODE != type)
1121 {
1122 break;
1123 }
1124 }
1125 }
1126
1127 return DTM.NULL;
1128 }
1129
1130 /**
1131 * Given a node handle, advance to its next sibling.
1132 * If not yet resolved, waits for more nodes to be added to the document and
1133 * tries again.
1134 * @param nodeHandle int Handle of the node.
1135 * @return int Node-number of next sibling,
1136 * or DTM.NULL to indicate none exists.
1137 */
1138 public int getNextSibling(int nodeHandle)
1139 {
1140 if (nodeHandle == DTM.NULL)
1141 return DTM.NULL;
1142 return makeNodeHandle(_nextsib(makeNodeIdentity(nodeHandle)));
1143 }
1144
1145 /**
1146 * Given a node handle, advance to its next sibling.
1147 * If not yet resolved, waits for more nodes to be added to the document and
1148 * tries again.
1149 * @param nodeHandle int Handle of the node.
1150 * @return int Node-number of next sibling,
1151 * or DTM.NULL to indicate none exists.
1152 */
1153 public int getTypedNextSibling(int nodeHandle, int nodeType)
1154 {
1155 if (nodeHandle == DTM.NULL)
1156 return DTM.NULL;
1157 int node = makeNodeIdentity(nodeHandle);
1158 int eType;
1159 while ((node = _nextsib(node)) != DTM.NULL &&
1160 ((eType = _exptype(node)) != nodeType &&
1161 m_expandedNameTable.getType(eType)!= nodeType));
1162 //_type(node) != nodeType));
1163
1164 return (node == DTM.NULL ? DTM.NULL : makeNodeHandle(node));
1165 }
1166
1167 /**
1168 * Given a node handle, find its preceeding sibling.
1169 * WARNING: DTM is asymmetric; this operation is resolved by search, and is
1170 * relatively expensive.
1171 *
1172 * @param nodeHandle the id of the node.
1173 * @return int Node-number of the previous sib,
1174 * or DTM.NULL to indicate none exists.
1175 */
1176 public int getPreviousSibling(int nodeHandle)
1177 {
1178 if (nodeHandle == DTM.NULL)
1179 return DTM.NULL;
1180
1181 if (m_prevsib != null)
1182 return makeNodeHandle(_prevsib(makeNodeIdentity(nodeHandle)));
1183 else
1184 {
1185 // If the previous sibling array is not built, we get at
1186 // the previous sibling using the parent, firstch and
1187 // nextsib arrays.
1188 int nodeID = makeNodeIdentity(nodeHandle);
1189 int parent = _parent(nodeID);
1190 int node = _firstch(parent);
1191 int result = DTM.NULL;
1192 while (node != nodeID)
1193 {
1194 result = node;
1195 node = _nextsib(node);
1196 }
1197 return makeNodeHandle(result);
1198 }
1199 }
1200
1201 /**
1202 * Given a node handle, advance to the next attribute.
1203 * If an attr, we advance to
1204 * the next attr on the same node. If not an attribute, we return NULL.
1205 *
1206 * @param nodeHandle int Handle of the node.
1207 * @return int DTM node-number of the resolved attr,
1208 * or DTM.NULL to indicate none exists.
1209 */
1210 public int getNextAttribute(int nodeHandle) {
1211 int nodeID = makeNodeIdentity(nodeHandle);
1212
1213 if (_type(nodeID) == DTM.ATTRIBUTE_NODE) {
1214 return makeNodeHandle(getNextAttributeIdentity(nodeID));
1215 }
1216
1217 return DTM.NULL;
1218 }
1219
1220 /**
1221 * Given a node identity for an attribute, advance to the next attribute.
1222 *
1223 * @param identity int identity of the attribute node. This
1224 * <strong>must</strong> be an attribute node.
1225 *
1226 * @return int DTM node-identity of the resolved attr,
1227 * or DTM.NULL to indicate none exists.
1228 *
1229 */
1230 protected int getNextAttributeIdentity(int identity) {
1231 // Assume that attributes and namespace nodes immediately follow the element
1232 while (DTM.NULL != (identity = getNextNodeIdentity(identity))) {
1233 int type = _type(identity);
1234
1235 if (type == DTM.ATTRIBUTE_NODE) {
1236 return identity;
1237 } else if (type != DTM.NAMESPACE_NODE) {
1238 break;
1239 }
1240 }
1241
1242 return DTM.NULL;
1243 }
1244
1245 /** Lazily created namespace lists. */
1246 private Vector m_namespaceLists = null; // on demand
1247
1248
1249 /** Build table of namespace declaration
1250 * locations during DTM construction. Table is a Vector of
1251 * SuballocatedIntVectors containing the namespace node HANDLES declared at
1252 * that ID, plus an SuballocatedIntVector of the element node INDEXES at which
1253 * these declarations appeared.
1254 *
1255 * NOTE: Since this occurs during model build, nodes will be encountered
1256 * in doucment order and thus the table will be ordered by element,
1257 * permitting binary-search as a possible retrieval optimization.
1258 *
1259 * %REVIEW% Directly managed arrays rather than vectors?
1260 * %REVIEW% Handles or IDs? Given usage, I think handles.
1261 * */
1262 protected void declareNamespaceInContext(int elementNodeIndex,int namespaceNodeIndex)
1263 {
1264 SuballocatedIntVector nsList=null;
1265 if(m_namespaceDeclSets==null)
1266 {
1267
1268 // First
1269 m_namespaceDeclSetElements=new SuballocatedIntVector(32);
1270 m_namespaceDeclSetElements.addElement(elementNodeIndex);
1271 m_namespaceDeclSets=new Vector();
1272 nsList=new SuballocatedIntVector(32);
1273 m_namespaceDeclSets.addElement(nsList);
1274 }
1275 else
1276 {
1277 // Most recent. May be -1 (none) if DTM was pruned.
1278 // %OPT% Is there a lastElement() method? Should there be?
1279 int last=m_namespaceDeclSetElements.size()-1;
1280
1281 if(last>=0 && elementNodeIndex==m_namespaceDeclSetElements.elementAt(last))
1282 {
1283 nsList=(SuballocatedIntVector)m_namespaceDeclSets.elementAt(last);
1284 }
1285 }
1286 if(nsList==null)
1287 {
1288 m_namespaceDeclSetElements.addElement(elementNodeIndex);
1289
1290 SuballocatedIntVector inherited =
1291 findNamespaceContext(_parent(elementNodeIndex));
1292
1293 if (inherited!=null) {
1294 // %OPT% Count-down might be faster, but debuggability may
1295 // be better this way, and if we ever decide we want to
1296 // keep this ordered by expanded-type...
1297 int isize=inherited.size();
1298
1299 // Base the size of a new namespace list on the
1300 // size of the inherited list - but within reason!
1301 nsList=new SuballocatedIntVector(Math.max(Math.min(isize+16,2048),
1302 32));
1303
1304 for(int i=0;i<isize;++i)
1305 {
1306 nsList.addElement(inherited.elementAt(i));
1307 }
1308 } else {
1309 nsList=new SuballocatedIntVector(32);
1310 }
1311
1312 m_namespaceDeclSets.addElement(nsList);
1313 }
1314
1315 // Handle overwriting inherited.
1316 // %OPT% Keep sorted? (By expanded-name rather than by doc order...)
1317 // Downside: Would require insertElementAt if not found,
1318 // which has recopying costs. But these are generally short lists...
1319 int newEType=_exptype(namespaceNodeIndex);
1320
1321 for(int i=nsList.size()-1;i>=0;--i)
1322 {
1323 if(newEType==getExpandedTypeID(nsList.elementAt(i)))
1324 {
1325 nsList.setElementAt(makeNodeHandle(namespaceNodeIndex),i);
1326 return;
1327 }
1328 }
1329 nsList.addElement(makeNodeHandle(namespaceNodeIndex));
1330 }
1331
1332 /** Retrieve list of namespace declaration locations
1333 * active at this node. List is an SuballocatedIntVector whose
1334 * entries are the namespace node HANDLES declared at that ID.
1335 *
1336 * %REVIEW% Directly managed arrays rather than vectors?
1337 * %REVIEW% Handles or IDs? Given usage, I think handles.
1338 * */
1339 protected SuballocatedIntVector findNamespaceContext(int elementNodeIndex)
1340 {
1341 if (null!=m_namespaceDeclSetElements)
1342 {
1343 // %OPT% Is binary-search really saving us a lot versus linear?
1344 // (... It may be, in large docs with many NS decls.)
1345 int wouldBeAt=findInSortedSuballocatedIntVector(m_namespaceDeclSetElements,
1346 elementNodeIndex);
1347 if(wouldBeAt>=0) // Found it
1348 return (SuballocatedIntVector) m_namespaceDeclSets.elementAt(wouldBeAt);
1349 if(wouldBeAt == -1) // -1-wouldbeat == 0
1350 return null; // Not after anything; definitely not found
1351
1352 // Not found, but we know where it should have been.
1353 // Search back until we find an ancestor or run out.
1354 wouldBeAt=-1-wouldBeAt;
1355
1356 // Decrement wouldBeAt to find last possible ancestor
1357 int candidate=m_namespaceDeclSetElements.elementAt(-- wouldBeAt);
1358 int ancestor=_parent(elementNodeIndex);
1359
1360 // Special case: if the candidate is before the given node, and
1361 // is in the earliest possible position in the document, it
1362 // must have the namespace declarations we're interested in.
1363 if (wouldBeAt == 0 && candidate < ancestor) {
1364 int rootHandle = getDocumentRoot(makeNodeHandle(elementNodeIndex));
1365 int rootID = makeNodeIdentity(rootHandle);
1366 int uppermostNSCandidateID;
1367
1368 if (getNodeType(rootHandle) == DTM.DOCUMENT_NODE) {
1369 int ch = _firstch(rootID);
1370 uppermostNSCandidateID = (ch != DTM.NULL) ? ch : rootID;
1371 } else {
1372 uppermostNSCandidateID = rootID;
1373 }
1374
1375 if (candidate == uppermostNSCandidateID) {
1376 return (SuballocatedIntVector)m_namespaceDeclSets.elementAt(wouldBeAt);
1377 }
1378 }
1379
1380 while(wouldBeAt>=0 && ancestor>0)
1381 {
1382 if (candidate==ancestor) {
1383 // Found ancestor in list
1384 return (SuballocatedIntVector)m_namespaceDeclSets.elementAt(wouldBeAt);
1385 } else if (candidate<ancestor) {
1386 // Too deep in tree
1387 do {
1388 ancestor=_parent(ancestor);
1389 } while (candidate < ancestor);
1390 } else if(wouldBeAt > 0){
1391 // Too late in list
1392 candidate=m_namespaceDeclSetElements.elementAt(--wouldBeAt);
1393 }
1394 else
1395 break;
1396 }
1397 }
1398
1399 return null; // No namespaces known at this node
1400 }
1401
1402 /**
1403 * Subroutine: Locate the specified node within
1404 * m_namespaceDeclSetElements, or the last element which
1405 * preceeds it in document order
1406 *
1407 * %REVIEW% Inlne this into findNamespaceContext? Create SortedSuballocatedIntVector type?
1408 *
1409 * @return If positive or zero, the index of the found item.
1410 * If negative, index of the point at which it would have appeared,
1411 * encoded as -1-index and hence reconvertable by subtracting
1412 * it from -1. (Encoding because I don't want to recompare the strings
1413 * but don't want to burn bytes on a datatype to hold a flagged value.)
1414 */
1415 protected int findInSortedSuballocatedIntVector(SuballocatedIntVector vector, int lookfor)
1416 {
1417 // Binary search
1418 int i = 0;
1419 if(vector != null) {
1420 int first = 0;
1421 int last = vector.size() - 1;
1422
1423 while (first <= last) {
1424 i = (first + last) / 2;
1425 int test = lookfor-vector.elementAt(i);
1426 if(test == 0) {
1427 return i; // Name found
1428 }
1429 else if (test < 0) {
1430 last = i - 1; // looked too late
1431 }
1432 else {
1433 first = i + 1; // looked ot early
1434 }
1435 }
1436
1437 if (first > i) {
1438 i = first; // Clean up at loop end
1439 }
1440 }
1441
1442 return -1 - i; // not-found has to be encoded.
1443 }
1444
1445
1446 /**
1447 * Given a node handle, get the index of the node's first child.
1448 * If not yet resolved, waits for more nodes to be added to the document and
1449 * tries again
1450 *
1451 * @param nodeHandle handle to node, which should probably be an element
1452 * node, but need not be.
1453 *
1454 * @param inScope true if all namespaces in scope should be returned,
1455 * false if only the namespace declarations should be
1456 * returned.
1457 * @return handle of first namespace, or DTM.NULL to indicate none exists.
1458 */
1459 public int getFirstNamespaceNode(int nodeHandle, boolean inScope)
1460 {
1461 if(inScope)
1462 {
1463 int identity = makeNodeIdentity(nodeHandle);
1464 if (_type(identity) == DTM.ELEMENT_NODE)
1465 {
1466 SuballocatedIntVector nsContext=findNamespaceContext(identity);
1467 if(nsContext==null || nsContext.size()<1)
1468 return NULL;
1469
1470 return nsContext.elementAt(0);
1471 }
1472 else
1473 return NULL;
1474 }
1475 else
1476 {
1477 // Assume that attributes and namespaces immediately
1478 // follow the element.
1479 //
1480 // %OPT% Would things be faster if all NS nodes were built
1481 // before all Attr nodes? Some costs at build time for 2nd
1482 // pass...
1483 int identity = makeNodeIdentity(nodeHandle);
1484 if (_type(identity) == DTM.ELEMENT_NODE)
1485 {
1486 while (DTM.NULL != (identity = getNextNodeIdentity(identity)))
1487 {
1488 int type = _type(identity);
1489 if (type == DTM.NAMESPACE_NODE)
1490 return makeNodeHandle(identity);
1491 else if (DTM.ATTRIBUTE_NODE != type)
1492 break;
1493 }
1494 return NULL;
1495 }
1496 else
1497 return NULL;
1498 }
1499 }
1500
1501 /**
1502 * Given a namespace handle, advance to the next namespace.
1503 *
1504 * @param baseHandle handle to original node from where the first namespace
1505 * was relative to (needed to return nodes in document order).
1506 * @param nodeHandle A namespace handle for which we will find the next node.
1507 * @param inScope true if all namespaces that are in scope should be processed,
1508 * otherwise just process the nodes in the given element handle.
1509 * @return handle of next namespace, or DTM.NULL to indicate none exists.
1510 */
1511 public int getNextNamespaceNode(int baseHandle, int nodeHandle,
1512 boolean inScope)
1513 {
1514 if(inScope)
1515 {
1516 //Since we've been given the base, try direct lookup
1517 //(could look from nodeHandle but this is at least one
1518 //comparison/get-parent faster)
1519 //SuballocatedIntVector nsContext=findNamespaceContext(nodeHandle & m_mask);
1520
1521 SuballocatedIntVector nsContext=findNamespaceContext(makeNodeIdentity(baseHandle));
1522
1523 if(nsContext==null)
1524 return NULL;
1525 int i=1 + nsContext.indexOf(nodeHandle);
1526 if(i<=0 || i==nsContext.size())
1527 return NULL;
1528
1529 return nsContext.elementAt(i);
1530 }
1531 else
1532 {
1533 // Assume that attributes and namespace nodes immediately follow the element.
1534 int identity = makeNodeIdentity(nodeHandle);
1535 while (DTM.NULL != (identity = getNextNodeIdentity(identity)))
1536 {
1537 int type = _type(identity);
1538 if (type == DTM.NAMESPACE_NODE)
1539 {
1540 return makeNodeHandle(identity);
1541 }
1542 else if (type != DTM.ATTRIBUTE_NODE)
1543 {
1544 break;
1545 }
1546 }
1547 }
1548 return DTM.NULL;
1549 }
1550
1551 /**
1552 * Given a node handle, find its parent node.
1553 *
1554 * @param nodeHandle the id of the node.
1555 * @return int Node-number of parent,
1556 * or DTM.NULL to indicate none exists.
1557 */
1558 public int getParent(int nodeHandle)
1559 {
1560
1561 int identity = makeNodeIdentity(nodeHandle);
1562
1563 if (identity > 0)
1564 return makeNodeHandle(_parent(identity));
1565 else
1566 return DTM.NULL;
1567 }
1568
1569 /**
1570 * Find the Document node handle for the document currently under construction.
1571 * PLEASE NOTE that most people should use getOwnerDocument(nodeHandle) instead;
1572 * this version of the operation is primarily intended for use during negotiation
1573 * with the DTM Manager.
1574 *
1575 * @return int Node handle of document, which should always be valid.
1576 */
1577 public int getDocument()
1578 {
1579 return m_dtmIdent.elementAt(0); // makeNodeHandle(0)
1580 }
1581
1582 /**
1583 * Given a node handle, find the owning document node. This has the exact
1584 * same semantics as the DOM Document method of the same name, in that if
1585 * the nodeHandle is a document node, it will return NULL.
1586 *
1587 * <p>%REVIEW% Since this is DOM-specific, it may belong at the DOM
1588 * binding layer. Included here as a convenience function and to
1589 * aid porting of DOM code to DTM.</p>
1590 *
1591 * @param nodeHandle the id of the node.
1592 * @return int Node handle of owning document, or -1 if the node was a Docment
1593 */
1594 public int getOwnerDocument(int nodeHandle)
1595 {
1596
1597 if (DTM.DOCUMENT_NODE == getNodeType(nodeHandle))
1598 return DTM.NULL;
1599
1600 return getDocumentRoot(nodeHandle);
1601 }
1602
1603 /**
1604 * Given a node handle, find the owning document node. Unlike the DOM,
1605 * this considers the owningDocument of a Document to be itself.
1606 *
1607 * @param nodeHandle the id of the node.
1608 * @return int Node handle of owning document, or the nodeHandle if it is
1609 * a Document.
1610 */
1611 public int getDocumentRoot(int nodeHandle)
1612 {
1613 return getManager().getDTM(nodeHandle).getDocument();
1614 }
1615
1616 /**
1617 * Get the string-value of a node as a String object
1618 * (see http://www.w3.org/TR/xpath#data-model
1619 * for the definition of a node's string-value).
1620 *
1621 * @param nodeHandle The node ID.
1622 *
1623 * @return A string object that represents the string-value of the given node.
1624 */
1625 public abstract XMLString getStringValue(int nodeHandle);
1626
1627 /**
1628 * Get number of character array chunks in
1629 * the string-value of a node.
1630 * (see http://www.w3.org/TR/xpath#data-model
1631 * for the definition of a node's string-value).
1632 * Note that a single text node may have multiple text chunks.
1633 *
1634 * @param nodeHandle The node ID.
1635 *
1636 * @return number of character array chunks in
1637 * the string-value of a node.
1638 */
1639 public int getStringValueChunkCount(int nodeHandle)
1640 {
1641
1642 // %TBD%
1643 error(XMLMessages.createXMLMessage(XMLErrorResources.ER_METHOD_NOT_SUPPORTED, null));//("getStringValueChunkCount not yet supported!");
1644
1645 return 0;
1646 }
1647
1648 /**
1649 * Get a character array chunk in the string-value of a node.
1650 * (see http://www.w3.org/TR/xpath#data-model
1651 * for the definition of a node's string-value).
1652 * Note that a single text node may have multiple text chunks.
1653 *
1654 * @param nodeHandle The node ID.
1655 * @param chunkIndex Which chunk to get.
1656 * @param startAndLen An array of 2 where the start position and length of
1657 * the chunk will be returned.
1658 *
1659 * @return The character array reference where the chunk occurs.
1660 */
1661 public char[] getStringValueChunk(int nodeHandle, int chunkIndex,
1662 int[] startAndLen)
1663 {
1664
1665 // %TBD%
1666 error(XMLMessages.createXMLMessage(XMLErrorResources.ER_METHOD_NOT_SUPPORTED, null));//"getStringValueChunk not yet supported!");
1667
1668 return null;
1669 }
1670
1671 /**
1672 * Given a node handle, return an ID that represents the node's expanded name.
1673 *
1674 * @param nodeHandle The handle to the node in question.
1675 *
1676 * @return the expanded-name id of the node.
1677 */
1678 public int getExpandedTypeID(int nodeHandle)
1679 {
1680 // %REVIEW% This _should_ only be null if someone asked the wrong DTM about the node...
1681 // which one would hope would never happen...
1682 int id=makeNodeIdentity(nodeHandle);
1683 if(id==NULL)
1684 return NULL;
1685 return _exptype(id);
1686 }
1687
1688 /**
1689 * Given an expanded name, return an ID. If the expanded-name does not
1690 * exist in the internal tables, the entry will be created, and the ID will
1691 * be returned. Any additional nodes that are created that have this
1692 * expanded name will use this ID.
1693 *
1694 * @param type The simple type, i.e. one of ELEMENT, ATTRIBUTE, etc.
1695 *
1696 * @param namespace The namespace URI, which may be null, may be an empty
1697 * string (which will be the same as null), or may be a
1698 * namespace URI.
1699 * @param localName The local name string, which must be a valid
1700 * <a href="http://www.w3.org/TR/REC-xml-names/">NCName</a>.
1701 *
1702 * @return the expanded-name id of the node.
1703 */
1704 public int getExpandedTypeID(String namespace, String localName, int type)
1705 {
1706
1707 ExpandedNameTable ent = m_expandedNameTable;
1708
1709 return ent.getExpandedTypeID(namespace, localName, type);
1710 }
1711
1712 /**
1713 * Given an expanded-name ID, return the local name part.
1714 *
1715 * @param expandedNameID an ID that represents an expanded-name.
1716 * @return String Local name of this node.
1717 */
1718 public String getLocalNameFromExpandedNameID(int expandedNameID)
1719 {
1720 return m_expandedNameTable.getLocalName(expandedNameID);
1721 }
1722
1723 /**
1724 * Given an expanded-name ID, return the namespace URI part.
1725 *
1726 * @param expandedNameID an ID that represents an expanded-name.
1727 * @return String URI value of this node's namespace, or null if no
1728 * namespace was resolved.
1729 */
1730 public String getNamespaceFromExpandedNameID(int expandedNameID)
1731 {
1732 return m_expandedNameTable.getNamespace(expandedNameID);
1733 }
1734
1735 /**
1736 * Returns the namespace type of a specific node
1737 * @param nodeHandle the id of the node.
1738 * @return the ID of the namespace.
1739 */
1740 public int getNamespaceType(final int nodeHandle)
1741 {
1742
1743 int identity = makeNodeIdentity(nodeHandle);
1744 int expandedNameID = _exptype(identity);
1745
1746 return m_expandedNameTable.getNamespaceID(expandedNameID);
1747 }
1748
1749 /**
1750 * Given a node handle, return its DOM-style node name. This will
1751 * include names such as #text or #document.
1752 *
1753 * @param nodeHandle the id of the node.
1754 * @return String Name of this node, which may be an empty string.
1755 * %REVIEW% Document when empty string is possible...
1756 * %REVIEW-COMMENT% It should never be empty, should it?
1757 */
1758 public abstract String getNodeName(int nodeHandle);
1759
1760 /**
1761 * Given a node handle, return the XPath node name. This should be
1762 * the name as described by the XPath data model, NOT the DOM-style
1763 * name.
1764 *
1765 * @param nodeHandle the id of the node.
1766 * @return String Name of this node, which may be an empty string.
1767 */
1768 public String getNodeNameX(int nodeHandle)
1769 {
1770
1771 /** @todo: implement this org.apache.xml.dtm.DTMDefaultBase abstract method */
1772 error(XMLMessages.createXMLMessage(XMLErrorResources.ER_METHOD_NOT_SUPPORTED, null));//"Not yet supported!");
1773
1774 return null;
1775 }
1776
1777 /**
1778 * Given a node handle, return its XPath-style localname.
1779 * (As defined in Namespaces, this is the portion of the name after any
1780 * colon character).
1781 *
1782 * @param nodeHandle the id of the node.
1783 * @return String Local name of this node.
1784 */
1785 public abstract String getLocalName(int nodeHandle);
1786
1787 /**
1788 * Given a namespace handle, return the prefix that the namespace decl is
1789 * mapping.
1790 * Given a node handle, return the prefix used to map to the namespace.
1791 *
1792 * <p> %REVIEW% Are you sure you want "" for no prefix? </p>
1793 * <p> %REVIEW-COMMENT% I think so... not totally sure. -sb </p>
1794 *
1795 * @param nodeHandle the id of the node.
1796 * @return String prefix of this node's name, or "" if no explicit
1797 * namespace prefix was given.
1798 */
1799 public abstract String getPrefix(int nodeHandle);
1800
1801 /**
1802 * Given a node handle, return its DOM-style namespace URI
1803 * (As defined in Namespaces, this is the declared URI which this node's
1804 * prefix -- or default in lieu thereof -- was mapped to.)
1805 *
1806 * <p>%REVIEW% Null or ""? -sb</p>
1807 *
1808 * @param nodeHandle the id of the node.
1809 * @return String URI value of this node's namespace, or null if no
1810 * namespace was resolved.
1811 */
1812 public abstract String getNamespaceURI(int nodeHandle);
1813
1814 /**
1815 * Given a node handle, return its node value. This is mostly
1816 * as defined by the DOM, but may ignore some conveniences.
1817 * <p>
1818 *
1819 * @param nodeHandle The node id.
1820 * @return String Value of this node, or null if not
1821 * meaningful for this node type.
1822 */
1823 public abstract String getNodeValue(int nodeHandle);
1824
1825 /**
1826 * Given a node handle, return its DOM-style node type.
1827 * <p>
1828 * %REVIEW% Generally, returning short is false economy. Return int?
1829 * %REVIEW% Make assumption that node has already arrived. Is OK?
1830 *
1831 * @param nodeHandle The node id.
1832 * @return int Node type, as per the DOM's Node._NODE constants.
1833 */
1834 public short getNodeType(int nodeHandle)
1835 {
1836 if (nodeHandle == DTM.NULL)
1837 return DTM.NULL;
1838 return m_expandedNameTable.getType(_exptype(makeNodeIdentity(nodeHandle)));
1839 }
1840
1841 /**
1842 * Get the depth level of this node in the tree (equals 1 for
1843 * a parentless node).
1844 *
1845 * @param nodeHandle The node id.
1846 * @return the number of ancestors, plus one
1847 * @xsl.usage internal
1848 */
1849 public short getLevel(int nodeHandle)
1850 {
1851 // Apparently, the axis walker stuff requires levels to count from 1.
1852 int identity = makeNodeIdentity(nodeHandle);
1853 return (short) (_level(identity) + 1);
1854 }
1855
1856 /**
1857 * Get the identity of this node in the tree
1858 *
1859 * @param nodeHandle The node handle.
1860 * @return the node identity
1861 * @xsl.usage internal
1862 */
1863 public int getNodeIdent(int nodeHandle)
1864 {
1865 /*if (nodeHandle != DTM.NULL)
1866 return nodeHandle & m_mask;
1867 else
1868 return DTM.NULL;*/
1869
1870 return makeNodeIdentity(nodeHandle);
1871 }
1872
1873 /**
1874 * Get the handle of this node in the tree
1875 *
1876 * @param nodeId The node identity.
1877 * @return the node handle
1878 * @xsl.usage internal
1879 */
1880 public int getNodeHandle(int nodeId)
1881 {
1882 /*if (nodeId != DTM.NULL)
1883 return nodeId | m_dtmIdent;
1884 else
1885 return DTM.NULL;*/
1886
1887 return makeNodeHandle(nodeId);
1888 }
1889
1890 // ============== Document query functions ==============
1891
1892 /**
1893 * Tests whether DTM DOM implementation implements a specific feature and
1894 * that feature is supported by this node.
1895 *
1896 * @param feature The name of the feature to test.
1897 * @param version This is the version number of the feature to test.
1898 * If the version is not
1899 * specified, supporting any version of the feature will cause the
1900 * method to return <code>true</code>.
1901 * @return Returns <code>true</code> if the specified feature is
1902 * supported on this node, <code>false</code> otherwise.
1903 */
1904 public boolean isSupported(String feature, String version)
1905 {
1906
1907 // %TBD%
1908 return false;
1909 }
1910
1911 /**
1912 * Return the base URI of the document entity. If it is not known
1913 * (because the document was parsed from a socket connection or from
1914 * standard input, for example), the value of this property is unknown.
1915 *
1916 * @return the document base URI String object or null if unknown.
1917 */
1918 public String getDocumentBaseURI()
1919 {
1920 return m_documentBaseURI;
1921 }
1922
1923 /**
1924 * Set the base URI of the document entity.
1925 *
1926 * @param baseURI the document base URI String object or null if unknown.
1927 */
1928 public void setDocumentBaseURI(String baseURI)
1929 {
1930 m_documentBaseURI = baseURI;
1931 }
1932
1933 /**
1934 * Return the system identifier of the document entity. If
1935 * it is not known, the value of this property is unknown.
1936 *
1937 * @param nodeHandle The node id, which can be any valid node handle.
1938 * @return the system identifier String object or null if unknown.
1939 */
1940 public String getDocumentSystemIdentifier(int nodeHandle)
1941 {
1942
1943 // %REVIEW% OK? -sb
1944 return m_documentBaseURI;
1945 }
1946
1947 /**
1948 * Return the name of the character encoding scheme
1949 * in which the document entity is expressed.
1950 *
1951 * @param nodeHandle The node id, which can be any valid node handle.
1952 * @return the document encoding String object.
1953 * @xsl.usage internal
1954 */
1955 public String getDocumentEncoding(int nodeHandle)
1956 {
1957
1958 // %REVIEW% OK?? -sb
1959 return "UTF-8";
1960 }
1961
1962 /**
1963 * Return an indication of the standalone status of the document,
1964 * either "yes" or "no". This property is derived from the optional
1965 * standalone document declaration in the XML declaration at the
1966 * beginning of the document entity, and has no value if there is no
1967 * standalone document declaration.
1968 *
1969 * @param nodeHandle The node id, which can be any valid node handle.
1970 * @return the document standalone String object, either "yes", "no", or null.
1971 */
1972 public String getDocumentStandalone(int nodeHandle)
1973 {
1974 return null;
1975 }
1976
1977 /**
1978 * Return a string representing the XML version of the document. This
1979 * property is derived from the XML declaration optionally present at the
1980 * beginning of the document entity, and has no value if there is no XML
1981 * declaration.
1982 *
1983 * @param documentHandle The document handle
1984 *
1985 * @return the document version String object.
1986 */
1987 public String getDocumentVersion(int documentHandle)
1988 {
1989 return null;
1990 }
1991
1992 /**
1993 * Return an indication of
1994 * whether the processor has read the complete DTD. Its value is a
1995 * boolean. If it is false, then certain properties (indicated in their
1996 * descriptions below) may be unknown. If it is true, those properties
1997 * are never unknown.
1998 *
1999 * @return <code>true</code> if all declarations were processed;
2000 * <code>false</code> otherwise.
2001 */
2002 public boolean getDocumentAllDeclarationsProcessed()
2003 {
2004
2005 // %REVIEW% OK?
2006 return true;
2007 }
2008
2009 /**
2010 * A document type declaration information item has the following properties:
2011 *
2012 * 1. [system identifier] The system identifier of the external subset, if
2013 * it exists. Otherwise this property has no value.
2014 *
2015 * @return the system identifier String object, or null if there is none.
2016 */
2017 public abstract String getDocumentTypeDeclarationSystemIdentifier();
2018
2019 /**
2020 * Return the public identifier of the external subset,
2021 * normalized as described in 4.2.2 External Entities [XML]. If there is
2022 * no external subset or if it has no public identifier, this property
2023 * has no value.
2024 *
2025 * @return the public identifier String object, or null if there is none.
2026 */
2027 public abstract String getDocumentTypeDeclarationPublicIdentifier();
2028
2029 /**
2030 * Returns the <code>Element</code> whose <code>ID</code> is given by
2031 * <code>elementId</code>. If no such element exists, returns
2032 * <code>DTM.NULL</code>. Behavior is not defined if more than one element
2033 * has this <code>ID</code>. Attributes (including those
2034 * with the name "ID") are not of type ID unless so defined by DTD/Schema
2035 * information available to the DTM implementation.
2036 * Implementations that do not know whether attributes are of type ID or
2037 * not are expected to return <code>DTM.NULL</code>.
2038 *
2039 * <p>%REVIEW% Presumably IDs are still scoped to a single document,
2040 * and this operation searches only within a single document, right?
2041 * Wouldn't want collisions between DTMs in the same process.</p>
2042 *
2043 * @param elementId The unique <code>id</code> value for an element.
2044 * @return The handle of the matching element.
2045 */
2046 public abstract int getElementById(String elementId);
2047
2048 /**
2049 * The getUnparsedEntityURI function returns the URI of the unparsed
2050 * entity with the specified name in the same document as the context
2051 * node (see [3.3 Unparsed Entities]). It returns the empty string if
2052 * there is no such entity.
2053 * <p>
2054 * XML processors may choose to use the System Identifier (if one
2055 * is provided) to resolve the entity, rather than the URI in the
2056 * Public Identifier. The details are dependent on the processor, and
2057 * we would have to support some form of plug-in resolver to handle
2058 * this properly. Currently, we simply return the System Identifier if
2059 * present, and hope that it a usable URI or that our caller can
2060 * map it to one.
2061 * TODO: Resolve Public Identifiers... or consider changing function name.
2062 * <p>
2063 * If we find a relative URI
2064 * reference, XML expects it to be resolved in terms of the base URI
2065 * of the document. The DOM doesn't do that for us, and it isn't
2066 * entirely clear whether that should be done here; currently that's
2067 * pushed up to a higher level of our application. (Note that DOM Level
2068 * 1 didn't store the document's base URI.)
2069 * TODO: Consider resolving Relative URIs.
2070 * <p>
2071 * (The DOM's statement that "An XML processor may choose to
2072 * completely expand entities before the structure model is passed
2073 * to the DOM" refers only to parsed entities, not unparsed, and hence
2074 * doesn't affect this function.)
2075 *
2076 * @param name A string containing the Entity Name of the unparsed
2077 * entity.
2078 *
2079 * @return String containing the URI of the Unparsed Entity, or an
2080 * empty string if no such entity exists.
2081 */
2082 public abstract String getUnparsedEntityURI(String name);
2083
2084 // ============== Boolean methods ================
2085
2086 /**
2087 * Return true if the xsl:strip-space or xsl:preserve-space was processed
2088 * during construction of the DTM document.
2089 *
2090 * @return true if this DTM supports prestripping.
2091 */
2092 public boolean supportsPreStripping()
2093 {
2094 return true;
2095 }
2096
2097 /**
2098 * Figure out whether nodeHandle2 should be considered as being later
2099 * in the document than nodeHandle1, in Document Order as defined
2100 * by the XPath model. This may not agree with the ordering defined
2101 * by other XML applications.
2102 * <p>
2103 * There are some cases where ordering isn't defined, and neither are
2104 * the results of this function -- though we'll generally return false.
2105 *
2106 * @param nodeHandle1 Node handle to perform position comparison on.
2107 * @param nodeHandle2 Second Node handle to perform position comparison on .
2108 *
2109 * @return true if node1 comes before node2, otherwise return false.
2110 * You can think of this as
2111 * <code>(node1.documentOrderPosition <= node2.documentOrderPosition)</code>.
2112 */
2113 public boolean isNodeAfter(int nodeHandle1, int nodeHandle2)
2114 {
2115 // These return NULL if the node doesn't belong to this document.
2116 int index1 = makeNodeIdentity(nodeHandle1);
2117 int index2 = makeNodeIdentity(nodeHandle2);
2118
2119 return index1!=NULL && index2!=NULL && index1 <= index2;
2120 }
2121
2122 /**
2123 * 2. [element content whitespace] A boolean indicating whether the
2124 * character is white space appearing within element content (see [XML],
2125 * 2.10 "White Space Handling"). Note that validating XML processors are
2126 * required by XML 1.0 to provide this information. If there is no
2127 * declaration for the containing element, this property has no value for
2128 * white space characters. If no declaration has been read, but the [all
2129 * declarations processed] property of the document information item is
2130 * false (so there may be an unread declaration), then the value of this
2131 * property is unknown for white space characters. It is always false for
2132 * characters that are not white space.
2133 *
2134 * @param nodeHandle the node ID.
2135 * @return <code>true</code> if the character data is whitespace;
2136 * <code>false</code> otherwise.
2137 */
2138 public boolean isCharacterElementContentWhitespace(int nodeHandle)
2139 {
2140
2141 // %TBD%
2142 return false;
2143 }
2144
2145 /**
2146 * 10. [all declarations processed] This property is not strictly speaking
2147 * part of the infoset of the document. Rather it is an indication of
2148 * whether the processor has read the complete DTD. Its value is a
2149 * boolean. If it is false, then certain properties (indicated in their
2150 * descriptions below) may be unknown. If it is true, those properties
2151 * are never unknown.
2152 *
2153 * @param documentHandle A node handle that must identify a document.
2154 * @return <code>true</code> if all declarations were processed;
2155 * <code>false</code> otherwise.
2156 */
2157 public boolean isDocumentAllDeclarationsProcessed(int documentHandle)
2158 {
2159 return true;
2160 }
2161
2162 /**
2163 * 5. [specified] A flag indicating whether this attribute was actually
2164 * specified in the start-tag of its element, or was defaulted from the
2165 * DTD.
2166 *
2167 * @param attributeHandle The attribute handle in question.
2168 *
2169 * @return <code>true</code> if the attribute was specified;
2170 * <code>false</code> if it was defaulted.
2171 */
2172 public abstract boolean isAttributeSpecified(int attributeHandle);
2173
2174 // ========== Direct SAX Dispatch, for optimization purposes ========
2175
2176 /**
2177 * Directly call the
2178 * characters method on the passed ContentHandler for the
2179 * string-value of the given node (see http://www.w3.org/TR/xpath#data-model
2180 * for the definition of a node's string-value). Multiple calls to the
2181 * ContentHandler's characters methods may well occur for a single call to
2182 * this method.
2183 *
2184 * @param nodeHandle The node ID.
2185 * @param ch A non-null reference to a ContentHandler.
2186 * @param normalize true if the content should be normalized according to
2187 * the rules for the XPath
2188 * <a href="http://www.w3.org/TR/xpath#function-normalize-space">normalize-space</a>
2189 * function.
2190 *
2191 * @throws org.xml.sax.SAXException
2192 */
2193 public abstract void dispatchCharactersEvents(
2194 int nodeHandle, org.xml.sax.ContentHandler ch, boolean normalize)
2195 throws org.xml.sax.SAXException;
2196
2197 /**
2198 * Directly create SAX parser events from a subtree.
2199 *
2200 * @param nodeHandle The node ID.
2201 * @param ch A non-null reference to a ContentHandler.
2202 *
2203 * @throws org.xml.sax.SAXException
2204 */
2205 public abstract void dispatchToEvents(
2206 int nodeHandle, org.xml.sax.ContentHandler ch)
2207 throws org.xml.sax.SAXException;
2208
2209 /**
2210 * Return an DOM node for the given node.
2211 *
2212 * @param nodeHandle The node ID.
2213 *
2214 * @return A node representation of the DTM node.
2215 */
2216 public org.w3c.dom.Node getNode(int nodeHandle)
2217 {
2218 return new DTMNodeProxy(this, nodeHandle);
2219 }
2220
2221 // ==== Construction methods (may not be supported by some implementations!) =====
2222
2223 /**
2224 * Append a child to the end of the document. Please note that the node
2225 * is always cloned if it is owned by another document.
2226 *
2227 * <p>%REVIEW% "End of the document" needs to be defined more clearly.
2228 * Does it become the last child of the Document? Of the root element?</p>
2229 *
2230 * @param newChild Must be a valid new node handle.
2231 * @param clone true if the child should be cloned into the document.
2232 * @param cloneDepth if the clone argument is true, specifies that the
2233 * clone should include all it's children.
2234 */
2235 public void appendChild(int newChild, boolean clone, boolean cloneDepth)
2236 {
2237 error(XMLMessages.createXMLMessage(XMLErrorResources.ER_METHOD_NOT_SUPPORTED, null));//"appendChild not yet supported!");
2238 }
2239
2240 /**
2241 * Append a text node child that will be constructed from a string,
2242 * to the end of the document.
2243 *
2244 * <p>%REVIEW% "End of the document" needs to be defined more clearly.
2245 * Does it become the last child of the Document? Of the root element?</p>
2246 *
2247 * @param str Non-null reverence to a string.
2248 */
2249 public void appendTextChild(String str)
2250 {
2251 error(XMLMessages.createXMLMessage(XMLErrorResources.ER_METHOD_NOT_SUPPORTED, null));//"appendTextChild not yet supported!");
2252 }
2253
2254 /**
2255 * Simple error for asserts and the like.
2256 *
2257 * @param msg Error message to report.
2258 */
2259 protected void error(String msg)
2260 {
2261 throw new DTMException(msg);
2262 }
2263
2264 /**
2265 * Find out whether or not to strip whispace nodes.
2266 *
2267 *
2268 * @return whether or not to strip whispace nodes.
2269 */
2270 protected boolean getShouldStripWhitespace()
2271 {
2272 return m_shouldStripWS;
2273 }
2274
2275 /**
2276 * Set whether to strip whitespaces and push in current value of
2277 * m_shouldStripWS in m_shouldStripWhitespaceStack.
2278 *
2279 * @param shouldStrip Flag indicating whether to strip whitespace nodes
2280 */
2281 protected void pushShouldStripWhitespace(boolean shouldStrip)
2282 {
2283
2284 m_shouldStripWS = shouldStrip;
2285
2286 if (null != m_shouldStripWhitespaceStack)
2287 m_shouldStripWhitespaceStack.push(shouldStrip);
2288 }
2289
2290 /**
2291 * Set whether to strip whitespaces at this point by popping out
2292 * m_shouldStripWhitespaceStack.
2293 *
2294 */
2295 protected void popShouldStripWhitespace()
2296 {
2297 if (null != m_shouldStripWhitespaceStack)
2298 m_shouldStripWS = m_shouldStripWhitespaceStack.popAndTop();
2299 }
2300
2301 /**
2302 * Set whether to strip whitespaces and set the top of the stack to
2303 * the current value of m_shouldStripWS.
2304 *
2305 *
2306 * @param shouldStrip Flag indicating whether to strip whitespace nodes
2307 */
2308 protected void setShouldStripWhitespace(boolean shouldStrip)
2309 {
2310
2311 m_shouldStripWS = shouldStrip;
2312
2313 if (null != m_shouldStripWhitespaceStack)
2314 m_shouldStripWhitespaceStack.setTop(shouldStrip);
2315 }
2316
2317 /**
2318 * A dummy routine to satisify the abstract interface. If the DTM
2319 * implememtation that extends the default base requires notification
2320 * of registration, they can override this method.
2321 */
2322 public void documentRegistration()
2323 {
2324 }
2325
2326 /**
2327 * A dummy routine to satisify the abstract interface. If the DTM
2328 * implememtation that extends the default base requires notification
2329 * when the document is being released, they can override this method
2330 */
2331 public void documentRelease()
2332 {
2333 }
2334
2335 /**
2336 * Migrate a DTM built with an old DTMManager to a new DTMManager.
2337 * After the migration, the new DTMManager will treat the DTM as
2338 * one that is built by itself.
2339 * This is used to support DTM sharing between multiple transformations.
2340 * @param mgr the DTMManager
2341 */
2342 public void migrateTo(DTMManager mgr)
2343 {
2344 m_mgr = mgr;
2345 if(mgr instanceof DTMManagerDefault)
2346 m_mgrDefault=(DTMManagerDefault)mgr;
2347 }
2348
2349 /** Query which DTMManager this DTM is currently being handled by.
2350 *
2351 * %REVEW% Should this become part of the base DTM API?
2352 *
2353 * @return a DTMManager, or null if this is a "stand-alone" DTM.
2354 */
2355 public DTMManager getManager()
2356 {
2357 return m_mgr;
2358 }
2359
2360 /** Query which DTMIDs this DTM is currently using within the DTMManager.
2361 *
2362 * %REVEW% Should this become part of the base DTM API?
2363 *
2364 * @return an IntVector, or null if this is a "stand-alone" DTM.
2365 */
2366 public SuballocatedIntVector getDTMIDs()
2367 {
2368 if(m_mgr==null) return null;
2369 return m_dtmIdent;
2370 }
2371 }